% Conference paper in the VISIGRAPP 2018 revised selected papers (CCIS series).
% All personal names use the unambiguous "Last, First" form.
% NOTE(review): address is the publisher's city; Cham is inferred from the
% "Springer Nature Switzerland AG" copyright line in the note field -- confirm.
% TODO: the series volume number is not recorded here; add a volume field once verified.
@inproceedings{2fb3549e31c647af8d2d08040a302a33,
  author    = {D{\'i}az Barros, Jilliam M. and Mirbach, Bruno and Garcia, Frederic and Varanasi, Kiran and Stricker, Didier},
  title     = {Real-time head pose estimation by tracking and detection of keypoints and facial landmarks},
  booktitle = {Computer Vision, Imaging and Computer Graphics Theory and Applications -- 13th International Joint Conference, {VISIGRAPP} 2018, Revised Selected Papers},
  editor    = {Bechmann, Dominique and Chessa, Manuela and Cl{\'a}udio, Ana Paula and Imai, Francisco and Kerren, Andreas and Richard, Paul and Telea, Alexandru and Tremeau, Alain},
  series    = {Communications in Computer and Information Science},
  pages     = {326--349},
  publisher = {Springer},
  address   = {Cham},
  year      = {2019},
  doi       = {10.1007/978-3-030-26756-8_16},
  isbn      = {9783030267551},
  language  = {English},
  keywords  = {Detection, Facial landmarks, Head pose estimation, Kalman Filter, Keypoints, Real time, Tracking},
  abstract  = {We introduce a novel fusion framework for real-time head pose estimation using a tailored Kalman Filter. This approach estimates the pose from intensity images in monocular video data. The method is robust to extreme head rotations and varying illumination, with real-time capability. Our framework incorporates the head pose computed from a keypoint-based tracking scheme into the prediction step of the Kalman Filter and the head pose computed from a facial-landmark-based detection scheme into the correction step. The head pose from the tracking scheme is estimated from 2D keypoints tracked in two consecutive frames in the region of the head and their 3D projection on a simple geometric model. In contrast, the head pose from the detection scheme is estimated from 2D facial landmarks detected in each frame and their 3D correspondences retrieved through triangulation. In each scheme, the head pose results from the minimization of the reprojection error from the 3D-2D correspondences. In each iteration, we update the state transition matrix of the filter and subsequently the estimated covariance. We evaluated our approach on a publicly available dataset and compared with related methods of the state of the art. Our approach could achieve similar performance in terms of mean average error, while operating in real time. Furthermore, we tested our method on our own dataset, to evaluate its performance in the presence of large head rotations. We show good results even in cases where facial landmarks are partially occluded.},
  note      = {13th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications, {VISIGRAPP} 2018, held 27--29 January 2018. Publisher copyright: {\textcopyright} Springer Nature Switzerland AG 2019.},
}