@inproceedings{701b21bad4b743c995a965dd76764c6a,
title = "InterFormer: Human Interaction Understanding with Deformed Transformer",
abstract = "Human interaction understanding (HIU) is a crucial and challenging problem, which consists of two subtasks: individual action recognition and pairwise interactive recognition. Previous methods do not fully capture the temporal and spatial correlations when understanding human interactions. To alleviate the problem, we decouple HIU into complementary parts for exploring comprehensive correlations among individuals. Especially, we design a multi-branch network, named InterFormer, to jointly model these interactive relations, which contains two parallel encoders to generate spatial and temporal features separately, and Spatial-Temporal Transformers (STTransformer) to exploit spatial and temporal contextual information in a cross-manner. Extensive experiments are conducted on two benchmarks, and the proposed InterFormer achieves state-of-the-art performance on these datasets.",
keywords = "Human interaction, Spatial-temporal features, Transformer",
author = "Di He and Zexing Du and Xue Wang and Qing Wang",
note = "Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd.; 19th International Conference on Intelligent Computing, ICIC 2023 ; Conference date: 10-08-2023 Through 13-08-2023",
year = "2023",
doi = "10.1007/978-981-99-4761-4_17",
language = "英语",
isbn = "9789819947607",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "193--203",
editor = "De-Shuang Huang and Prashan Premaratne and Baohua Jin and Boyang Qu and Kang-Hyun Jo and Abir Hussain",
booktitle = "Advanced Intelligent Computing Technology and Applications - 19th International Conference, ICIC 2023, Proceedings",
}