@inproceedings{1e19ec60bbf241b2bd7c33b4f9909dcb,
title = "Deep selective feature learning for action recognition",
abstract = "Soft-attention mechanism has attracted a lot of attention in recent years due to its ability to capture the most discriminative image features for understanding actions. However, soft-attention tends to focus on fine-grained parts on images and ignores global information, which can lead to totally wrong classification results. To address this issue, we propose a novel deep selective feature learning network (DSFNet), which can automatically learn the feature maps with both fine-grained and global information. Specially, DSFNet is designed to have the ability to learn to adjust the actions for feature map selection by maximizing the cumulative discounted rewards. Moreover, the DSFNet is an easy-to-use extension of state-of-the-art base architectures of multiple tasks. Extensive experiments show that the proposed method has achieved superior performance on two standard action recognition benchmarks across still images (PPMI) and videos (HMDB51).",
keywords = "Action recognition, Feature selection, Reinforcement learning",
author = "Ziqiang Li and Yongxin Ge and Jinyuan Feng and Xiaolei Qin and Jiaruo Yu and Hui Yu",
year = "2020",
month = jul,
day = "6",
doi = "10.1109/ICME46284.2020.9102727",
language = "English",
isbn = "978-1-7281-1332-6",
series = "Proceedings - IEEE International Conference on Multimedia and Expo",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "2020 IEEE International Conference on Multimedia and Expo, ICME 2020",
address = "United States",
note = "2020 IEEE International Conference on Multimedia and Expo, ICME 2020 ; Conference date: 06-07-2020 Through 10-07-2020",
}