@inproceedings{c5a3b34a7ee84513b7beffceca6faa4c,
title = "Residual attention regression for 3D hand pose estimation",
abstract = "3D hand pose estimation is an important and challenging task for virtual reality and human-computer interaction. In this paper, we propose a simple and effective residual attention regression model for accurate 3D hand pose estimation from a depth image. The model is trained in an end-to-end fashion. Specifically, we stack different attention modules to capture different types of attention-aware features, and then implement physical constraints of the hand by projecting the pose parameters into a lower-dimensional space. In this way, 3D coordinates of hand joints are estimated directly. The experimental results demonstrate that our proposed residual attention network can achieve superior or comparable performance on three main challenging datasets, where the average 3D error is 9.7 mm on the MSRA dataset, 7.8 mm on the ICVL dataset, and 17.6 mm on the NYU dataset.",
keywords = "3D hand pose estimation, Attention mechanism, Convolutional neural network, Depth images",
author = "Jing Li and Long Zhang and Zhaojie Ju",
year = "2019",
month = aug,
day = "3",
doi = "10.1007/978-3-030-27538-9_52",
language = "English",
isbn = "978-3-030-27537-2",
series = "Lecture Notes in Computer Science",
publisher = "Springer",
pages = "605--614",
editor = "Haibin Yu and Jinguo Liu and Lianqing Liu and Zhaojie Ju and Yuwang Liu and Dalin Zhou",
booktitle = "Intelligent Robotics and Applications",
note = "12th International Conference on Intelligent Robotics and Applications, ICIRA 2019 ; Conference date: 08-08-2019 Through 11-08-2019",
}