@inproceedings{65e4ecee9890439888605aa0fe522353,
title = "A dual-stream spatial-temporal detector for action recognition",
abstract = "In response to the issue that existing human action recognition models can not make full use of complementary information from different modalities, this thesis proposes a multi-path attention module MA to form the MA-GCN model. modalities, this thesis proposes a dual-stream human action recognition model SRHAR that fuses skeleton data and RGB data. This model utilizes LAF proposed in this thesis to fuse skeleton features and RGB features. The introduction of skeleton modality enables the RGB modality to obtain the RGB features. The introduction of skeleton modality enables the RGB modality to obtain complementary information, resulting in more accurate prediction results. This algorithm focuses more on recognition accuracy and has a slower recognition speed, but achieves leading performance in terms of accuracy on public datasets.",
keywords = "action recognition, attention mechanism, lightweight",
author = "Pingping Wei and Jiale Li and Peiran Liu and Li Li and Yifei Xu and Ling Wang",
note = "Publisher Copyright: {\textcopyright} 2024 SPIE.; 4th International Conference on Computer Vision and Pattern Analysis, ICCPA 2024 ; Conference date: 17-05-2024 Through 19-05-2024",
year = "2024",
doi = "10.1117/12.3038011",
language = "英语",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
publisher = "SPIE",
editor = "Ji Zhao and Yonghui Yang",
booktitle = "Fourth International Conference on Computer Vision and Pattern Analysis, ICCPA 2024",
}