{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,2]],"date-time":"2024-09-02T11:08:22Z","timestamp":1725275302705},"reference-count":184,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2021,11,1]],"date-time":"2021-11-01T00:00:00Z","timestamp":1635724800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2021,11,1]],"date-time":"2021-11-01T00:00:00Z","timestamp":1635724800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2021,11,1]],"date-time":"2021-11-01T00:00:00Z","timestamp":1635724800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2021,11,1]],"date-time":"2021-11-01T00:00:00Z","timestamp":1635724800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2021,11,1]],"date-time":"2021-11-01T00:00:00Z","timestamp":1635724800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,11,1]],"date-time":"2021-11-01T00:00:00Z","timestamp":1635724800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Signal Processing: Image Communication"],"published-print":{"date-parts":[[2021,11]]},"DOI":"10.1016\/j.image.2021.116479","type":"journal-article","created":{"date-parts":[[2021,9,6]],"date-time":"2021-09-06T21:13:54Z","timestamp":1630962834000},"page":"116479","update-policy":"http:\/\/dx.doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":14,"special_numbering":"C","title":["Head pose estimation: A survey of the last ten years"],"prefix":"10.1016","volume":"99","author":[{"ORCID":"http:\/\/orcid.org\/0000-0002-0864-5255","authenticated-orcid":false,"given":"Khalil","family":"Khan","sequence":"first","affiliation":[]},{"ORCID":"http:\/\/orcid.org\/0000-0003-3323-2732","authenticated-orcid":false,"given":"Rehan Ullah","family":"Khan","sequence":"additional","affiliation":[]},{"given":"Riccardo","family":"Leonardi","sequence":"additional","affiliation":[]},{"given":"Pierangelo","family":"Migliorati","sequence":"additional","affiliation":[]},{"ORCID":"http:\/\/orcid.org\/0000-0003-2152-9424","authenticated-orcid":false,"given":"Sergio","family":"Benini","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.image.2021.116479_b1","doi-asserted-by":"crossref","unstructured":"M. Voit, R. Stiefelhagen, Deducing the visual focus of attention from head pose estimation in dynamic multi-view meeting scenarios, in: Proceedings of the 10th International Conference on Multimodal Interfaces, 2008, pp. 173\u2013180.","DOI":"10.1145\/1452392.1452425"},{"issue":"1","key":"10.1016\/j.image.2021.116479_b2","doi-asserted-by":"crossref","first-page":"101","DOI":"10.1109\/TPAMI.2010.69","article-title":"Multiperson visual focus of attention from head pose and meeting contextual cues","volume":"33","author":"Ba","year":"2010","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"2","key":"10.1016\/j.image.2021.116479_b3","doi-asserted-by":"crossref","first-page":"802","DOI":"10.1109\/TIP.2011.2162740","article-title":"Combining head pose and eye location information for gaze estimation","volume":"21","author":"Valenti","year":"2011","journal-title":"IEEE Trans. Image Process."},{"issue":"2","key":"10.1016\/j.image.2021.116479_b4","doi-asserted-by":"crossref","first-page":"300","DOI":"10.1109\/TITS.2010.2044241","article-title":"Head pose estimation and augmented reality tracking: An integrated system and evaluation for monitoring driver awareness","volume":"11","author":"Murphy-Chutorian","year":"2010","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"10.1016\/j.image.2021.116479_b5","series-title":"2018 13th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2018)","first-page":"789","article-title":"Human computer interaction with head pose, eye gaze and body gestures","author":"Wang","year":"2018"},{"key":"10.1016\/j.image.2021.116479_b6","series-title":"2007 7th IEEE-RAS International Conference on Humanoid Robots","first-page":"330","article-title":"Feature-based head pose estimation from images","author":"Vatahska","year":"2007"},{"key":"10.1016\/j.image.2021.116479_b7","series-title":"Proceedings of the 2016 ACM on International Conference on Multimedia Retrieval","first-page":"281","article-title":"Multimodal deep convolutional neural network for audio-visual emotion recognition","author":"Zhang","year":"2016"},{"issue":"3","key":"10.1016\/j.image.2021.116479_b8","doi-asserted-by":"crossref","first-page":"50","DOI":"10.3390\/mti3030050","article-title":"Exploring methods for predicting important utterances contributing to meeting summarization","volume":"3","author":"Nihei","year":"2019","journal-title":"Multimod. Technol. Interact."},{"key":"10.1016\/j.image.2021.116479_b9","unstructured":"S. Basu, T. Choudhury, B. Clarkson, A. Pentland, Towards measuring human interactions in conversational settings, in: Proc. IEEE CVPR Workshop on Cues in Communication, 2001."},{"key":"10.1016\/j.image.2021.116479_b10","series-title":"IEEE IV2003 Intelligent Vehicles Symposium. Proceedings (Cat. No. 03TH8683)","first-page":"444","article-title":"Driver\u2019s view and vehicle surround estimation using omnidirectional video stream","author":"Huang","year":"2003"},{"issue":"3","key":"10.1016\/j.image.2021.116479_b11","doi-asserted-by":"crossref","first-page":"305","DOI":"10.1109\/TPAMI.2005.49","article-title":"Automatic analysis of multimodal group actions in meetings","volume":"27","author":"McCowan","year":"2005","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.image.2021.116479_b12","series-title":"2007 IEEE International Conference on Multimedia and Expo","first-page":"1379","article-title":"A cognitive and unsupervised map adaptation approach to the recognition of the focus of attention from head pose","author":"Odobez","year":"2007"},{"issue":"4","key":"10.1016\/j.image.2021.116479_b13","doi-asserted-by":"crossref","first-page":"928","DOI":"10.1109\/TNN.2002.1021893","article-title":"Modeling focus of attention for meeting indexing based on multiple cues","volume":"13","author":"Stiefelhagen","year":"2002","journal-title":"IEEE Trans. Neural Netw."},{"key":"10.1016\/j.image.2021.116479_b14","series-title":"International Evaluation Workshop on Classification of Events, Activities and Relationships","first-page":"299","article-title":"Head pose estimation in seminar room using multi view face detectors","author":"Zhang","year":"2006"},{"key":"10.1016\/j.image.2021.116479_b15","series-title":"Proceedings of the 1st ACM International Workshop on Multimodal Pervasive Video Analysis","first-page":"37","article-title":"Space speaks: towards socially and personality aware visual surveillance","author":"Zen","year":"2010"},{"key":"10.1016\/j.image.2021.116479_b16","series-title":"Asian Conference on Computer Vision","first-page":"380","article-title":"Understanding interactions and guiding visual surveillance by tracking attention","author":"Reid","year":"2010"},{"key":"10.1016\/j.image.2021.116479_b17","series-title":"2011 Fifth ACM\/IEEE International Conference on Distributed Smart Cameras","first-page":"1","article-title":"Multiview social behavior analysis in work environments","author":"Chen","year":"2011"},{"key":"10.1016\/j.image.2021.116479_b18","series-title":"2007 IEEE Intelligent Transportation Systems Conference","first-page":"709","article-title":"Head pose estimation for driver assistance systems: A robust algorithm and experimental evaluation","author":"Murphy-Chutorian","year":"2007"},{"issue":"1","key":"10.1016\/j.image.2021.116479_b19","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1016\/j.aei.2011.09.005","article-title":"Coarse head pose estimation of construction equipment operators to formulate dynamic blind spots","volume":"26","author":"Ray","year":"2012","journal-title":"Adv. Eng. Inform."},{"key":"10.1016\/j.image.2021.116479_b20","series-title":"Joint Pattern Recognition Symposium","first-page":"51","article-title":"Combined head localization and head pose estimation for video\u2013based advanced driver assistance systems","author":"Schulz","year":"2011"},{"issue":"6","key":"10.1016\/j.image.2021.116479_b21","first-page":"7","article-title":"Guiding visual surveillance by tracking human attention","volume":"2","author":"Benfold","year":"2009","journal-title":"BMVC"},{"key":"10.1016\/j.image.2021.116479_b22","series-title":"2011 IEEE Workshop on Applications of Computer Vision (WACV)","first-page":"519","article-title":"Tracking gaze direction from far-field surveillance cameras","author":"Sankaranarayanan","year":"2011"},{"issue":"7","key":"10.1016\/j.image.2021.116479_b23","doi-asserted-by":"crossref","first-page":"1212","DOI":"10.1109\/TPAMI.2007.70773","article-title":"Tracking the visual focus of attention for a varying number of wandering people","volume":"30","author":"Smith","year":"2008","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"114","key":"10.1016\/j.image.2021.116479_b24","first-page":"247","article-title":"Xiii. on the apparent direction of eyes in a portrait","author":"Wollaston","year":"1824","journal-title":"Philos. Trans. R. Soc. Lond."},{"issue":"5","key":"10.1016\/j.image.2021.116479_b25","doi-asserted-by":"crossref","first-page":"752","DOI":"10.3758\/BF03194970","article-title":"The influence of head contour and nose angle on the perception of eye-gaze direction","volume":"66","author":"Langton","year":"2004","journal-title":"Percept. Psychophys."},{"key":"10.1016\/j.image.2021.116479_b26","series-title":"2010 20th International Conference on Pattern Recognition","first-page":"934","article-title":"Head pose estimation based on random forests for multiclass classification","author":"Huang","year":"2010"},{"key":"10.1016\/j.image.2021.116479_b27","series-title":"2017 IEEE International Conference on Multimedia and Expo (ICME)","first-page":"175","article-title":"Head pose estimation through multi-class face segmentation","author":"Khan","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b28","first-page":"1","article-title":"A framework for head pose estimation and face segmentation through conditional random fields","author":"Khan","year":"2019","journal-title":"Signal Imag. Video Process."},{"key":"10.1016\/j.image.2021.116479_b29","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1016\/j.image.2019.01.005","article-title":"Face analysis through semantic face segmentation","volume":"74","author":"Benini","year":"2019","journal-title":"Signal Process., Image Commun."},{"issue":"7","key":"10.1016\/j.image.2021.116479_b30","doi-asserted-by":"crossref","first-page":"647","DOI":"10.3390\/e21070647","article-title":"A unified framework for head pose, age and gender classification through end-to-end face segmentation","volume":"21","author":"Khan","year":"2019","journal-title":"Entropy"},{"key":"10.1016\/j.image.2021.116479_b31","series-title":"2015 IEEE International Conference on Image Processing (ICIP)","first-page":"827","article-title":"Multi-class semantic segmentation of faces","author":"Khan","year":"2015"},{"issue":"4","key":"10.1016\/j.image.2021.116479_b32","doi-asserted-by":"crossref","first-page":"607","DOI":"10.1109\/TPAMI.2008.106","article-title":"Head pose estimation in computer vision: A survey","volume":"31","author":"Murphy-Chutorian","year":"2008","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.image.2021.116479_b33","series-title":"2018 13th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2018)","first-page":"67","article-title":"Vggface2: A dataset for recognising faces across pose and age","author":"Cao","year":"2018"},{"key":"10.1016\/j.image.2021.116479_b34","doi-asserted-by":"crossref","unstructured":"J. Gu, X. Yang, S. De\u00a0Mello, J. Kautz, Dynamic facial analysis: From bayesian filtering to recurrent neural network, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2017, pp. 1548\u20131557.","DOI":"10.1109\/CVPR.2017.167"},{"key":"10.1016\/j.image.2021.116479_b35","series-title":"2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017)","first-page":"809","article-title":"Joint challenge on dominant and complementary emotion recognition using micro emotion features and head-pose estimation: Databases","author":"L\u00fcsi","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b36","doi-asserted-by":"crossref","first-page":"42","DOI":"10.1016\/j.neucom.2015.03.096","article-title":"Robust head pose estimation using Dirichlet-tree distribution enhanced random forests","volume":"173","author":"Liu","year":"2016","journal-title":"Neurocomputing"},{"key":"10.1016\/j.image.2021.116479_b37","series-title":"2016 IEEE International Conference on Image Processing (ICIP)","first-page":"1289","article-title":"3D head pose estimation with convolutional neural network trained on synthetic images","author":"Liu","year":"2016"},{"key":"10.1016\/j.image.2021.116479_b38","series-title":"2014 22nd International Conference on Pattern Recognition","first-page":"2263","article-title":"Robust real-time extreme head pose estimation","author":"Tulyakov","year":"2014"},{"issue":"3","key":"10.1016\/j.image.2021.116479_b39","doi-asserted-by":"crossref","first-page":"437","DOI":"10.1007\/s11263-012-0549-0","article-title":"Random forests for real time 3d face analysis","volume":"101","author":"Fanelli","year":"2013","journal-title":"Int. J. Comput. Vis."},{"issue":"3","key":"10.1016\/j.image.2021.116479_b40","doi-asserted-by":"crossref","first-page":"437","DOI":"10.1007\/s11263-012-0549-0","article-title":"Random forests for real time 3d face analysis","volume":"101","author":"Fanelli","year":"2013","journal-title":"Int. J. Comput. Vis."},{"issue":"1","key":"10.1016\/j.image.2021.116479_b41","doi-asserted-by":"crossref","first-page":"495","DOI":"10.1007\/s11042-012-1352-1","article-title":"Robust semi-automatic head pose labeling for real-world face video sequences","volume":"70","author":"Demirkus","year":"2014","journal-title":"Multimedia Tools Appl."},{"key":"10.1016\/j.image.2021.116479_b42","series-title":"2012 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"2610","article-title":"3D constrained local model for rigid and non-rigid facial tracking","author":"Baltru\u0161aitis","year":"2012"},{"key":"10.1016\/j.image.2021.116479_b43","series-title":"2012 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"2879","article-title":"Face detection, pose estimation, and landmark localization in the wild","author":"Zhu","year":"2012"},{"key":"10.1016\/j.image.2021.116479_b44","series-title":"2011 IEEE International Conference on Computer Vision Workshops (ICCV Workshops)","first-page":"2144","article-title":"Annotated facial landmarks in the wild: A large-scale, real-world database for facial landmark localization","author":"Koestinger","year":"2011"},{"issue":"5","key":"10.1016\/j.image.2021.116479_b45","doi-asserted-by":"crossref","first-page":"807","DOI":"10.1016\/j.imavis.2009.08.002","article-title":"Multi-pie","volume":"28","author":"Gross","year":"2010","journal-title":"Image Vis. Comput."},{"key":"10.1016\/j.image.2021.116479_b46","first-page":"020","article-title":"BJUT-3D large scale 3D face database and information processing","volume":"6","author":"Baocai","year":"2009","journal-title":"J. Comput. Res. Dev."},{"key":"10.1016\/j.image.2021.116479_b47","series-title":"2008 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"1","article-title":"Real-time face pose estimation from single range images","author":"Breitenstein","year":"2008"},{"key":"10.1016\/j.image.2021.116479_b48","series-title":"ICPR International Workshop on Visual Observation of Deictic Gestures","article-title":"Estimating face orientation from robust detection of salient facial features","author":"Gourier","year":"2004"},{"issue":"4","key":"10.1016\/j.image.2021.116479_b49","doi-asserted-by":"crossref","first-page":"322","DOI":"10.1109\/34.845375","article-title":"Fast, reliable head tracking under varying illumination: An approach based on registration of texture-mapped 3D models","volume":"22","author":"La\u00a0Cascia","year":"2000","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"6","key":"10.1016\/j.image.2021.116479_b50","doi-asserted-by":"crossref","first-page":"84","DOI":"10.1109\/MCG.2011.92","article-title":"3D rotations","volume":"31","author":"Taubin","year":"2011","journal-title":"IEEE Comput. Graph. Appl."},{"key":"10.1016\/j.image.2021.116479_b51","series-title":"Consumer Depth Cameras for Computer Vision","first-page":"3","article-title":"3D with kinect","author":"Smisek","year":"2013"},{"key":"10.1016\/j.image.2021.116479_b52","series-title":"2008 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"1","article-title":"Real-time face pose estimation from single range images","author":"Breitenstein","year":"2008"},{"key":"10.1016\/j.image.2021.116479_b53","doi-asserted-by":"crossref","first-page":"206","DOI":"10.1016\/j.neucom.2017.05.033","article-title":"Multi-level structured hybrid forest for joint head detection and pose estimation","volume":"266","author":"Liu","year":"2017","journal-title":"Neurocomputing"},{"issue":"7","key":"10.1016\/j.image.2021.116479_b54","doi-asserted-by":"crossref","first-page":"1502","DOI":"10.1109\/TNNLS.2015.2441735","article-title":"Compound rank-k projections for bilinear analysis","volume":"27","author":"Chang","year":"2015","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"10.1016\/j.image.2021.116479_b55","doi-asserted-by":"crossref","unstructured":"A. Schwarz, M. Haurilet, M. Martinez, R. Stiefelhagen, Driveahead-a large-scale driver head pose dataset, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, 2017, pp. 1\u201310.","DOI":"10.1109\/CVPRW.2017.155"},{"key":"10.1016\/j.image.2021.116479_b56","series-title":"Proceedings CVPR IEEE Computer Society Conference on Computer Vision and Pattern Recognition","first-page":"223","article-title":"Recognition of planar object classes","author":"Burl","year":"1996"},{"key":"10.1016\/j.image.2021.116479_b57","series-title":"3D Pose Estimation and Normalization for Face Recognition","author":"Jebara","year":"1995"},{"key":"10.1016\/j.image.2021.116479_b58","series-title":"Image Analysis","first-page":"319","article-title":"Head pose estimation using multi-scale Gaussian derivatives","author":"Jain","year":"2013"},{"key":"10.1016\/j.image.2021.116479_b59","doi-asserted-by":"crossref","first-page":"455","DOI":"10.1016\/j.neucom.2014.07.019","article-title":"VoD: a novel image representation for head yaw estimation","volume":"148","author":"Ma","year":"2015","journal-title":"Neurocomputing"},{"key":"10.1016\/j.image.2021.116479_b60","series-title":"2009 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"612","article-title":"Robustifying eye center localization by head pose cues","author":"Valenti","year":"2009"},{"issue":"3","key":"10.1016\/j.image.2021.116479_b61","doi-asserted-by":"crossref","first-page":"469","DOI":"10.1007\/s11042-008-0240-1","article-title":"Estimation of behavioral user state based on eye gaze and head pose\u2014application in an e-learning environment","volume":"41","author":"Asteriadis","year":"2009","journal-title":"Multimedia Tools Appl."},{"issue":"02","key":"10.1016\/j.image.2021.116479_b62","doi-asserted-by":"crossref","first-page":"193","DOI":"10.1142\/S0218213097000116","article-title":"A model-based gaze tracking system","volume":"6","author":"Stiefelhagen","year":"1997","journal-title":"Int. J. Artif. Intell. Tools"},{"key":"10.1016\/j.image.2021.116479_b63","unstructured":"F.H. Zavan, A.C. Nascimento, O.R. Bellon, L. Silva, Nosepose: a competitive, landmark-free methodology for head pose estimation in the wild, in: Conf. on Graphics, Patterns and Images-W. Face Processing 2016, 2016."},{"key":"10.1016\/j.image.2021.116479_b64","doi-asserted-by":"crossref","unstructured":"M. Svanera, U. Muhammad, R. Leonardi, S. Benini, Figaro, hair detection and segmentation in the wild, in: 2016 IEEE International Conference on Image Processing (ICIP), 2016, pp. 933\u2013937.","DOI":"10.1109\/ICIP.2016.7532494"},{"key":"10.1016\/j.image.2021.116479_b65","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1016\/j.imavis.2018.02.001","article-title":"Hair detection, segmentation, and hairstyle classification in the wild","volume":"71","author":"Muhammad","year":"2018","journal-title":"Image Vis. Comput."},{"issue":"1","key":"10.1016\/j.image.2021.116479_b66","doi-asserted-by":"crossref","first-page":"38","DOI":"10.1006\/cviu.1995.1004","article-title":"Active shape models-their training and application","volume":"61","author":"Cootes","year":"1995","journal-title":"Comput. Vis. Image Underst."},{"issue":"8","key":"10.1016\/j.image.2021.116479_b67","doi-asserted-by":"crossref","first-page":"1565","DOI":"10.1016\/S0031-3203(00)00091-1","article-title":"Fusion of perceptual cues for robust tracking of head pose and position","volume":"34","author":"Sherrah","year":"2001","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.image.2021.116479_b68","series-title":"Facial Feature Extraction and Determination of Pose","first-page":"257","author":"Nikolaidis","year":"1998"},{"issue":"3","key":"10.1016\/j.image.2021.116479_b69","doi-asserted-by":"crossref","first-page":"1138","DOI":"10.1016\/j.patcog.2007.07.017","article-title":"A two-stage head pose estimation framework and evaluation","volume":"41","author":"Wu","year":"2008","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.image.2021.116479_b70","doi-asserted-by":"crossref","first-page":"5457","DOI":"10.1109\/TIP.2020.2984373","article-title":"Web-shaped model for head pose estimation: An approach for best exemplar selection","volume":"29","author":"Barra","year":"2020","journal-title":"IEEE Trans. Image Process."},{"key":"10.1016\/j.image.2021.116479_b71","series-title":"Object Recognition Supported By User Interaction for Service Robots","first-page":"235","article-title":"Fast face detection with precise pose estimation","volume":"Vol. 1","author":"Fleuret","year":"2002"},{"key":"10.1016\/j.image.2021.116479_b72","series-title":"Learning to Learn","author":"Thrun","year":"2012"},{"issue":"1","key":"10.1016\/j.image.2021.116479_b73","doi-asserted-by":"crossref","first-page":"83","DOI":"10.1109\/TMM.2012.2225039","article-title":"Modeling functional roles dynamics in small group interactions","volume":"15","author":"Dong","year":"2012","journal-title":"IEEE Trans. Multimed."},{"issue":"1","key":"10.1016\/j.image.2021.116479_b74","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1109\/TPAMI.2017.2781233","article-title":"Hyperface: A deep multi-task learning framework for face detection, landmark localization, pose estimation, and gender recognition","volume":"41","author":"Ranjan","year":"2017","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.image.2021.116479_b75","doi-asserted-by":"crossref","unstructured":"X. Zhu, Z. Lei, X. Liu, H. Shi, S.Z. Li, Face alignment across large poses: A 3d solution, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2016, pp. 146\u2013155.","DOI":"10.1109\/CVPR.2016.23"},{"key":"10.1016\/j.image.2021.116479_b76","series-title":"Proceedings of IEEE Computer Society Conference on Computer Vision and Pattern Recognition","first-page":"144","article-title":"Parametrized structure from motion for 3D adaptive feedback tracking of faces","author":"Jebara","year":"1997"},{"key":"10.1016\/j.image.2021.116479_b77","series-title":"Proceedings of the 10th International Conference on Multimodal Interfaces","first-page":"173","article-title":"Deducing the visual focus of attention from head pose estimation in dynamic multi-view meeting scenarios","author":"Voit","year":"2008"},{"issue":"4","key":"10.1016\/j.image.2021.116479_b78","doi-asserted-by":"crossref","first-page":"607","DOI":"10.1109\/TPAMI.2008.106","article-title":"Head pose estimation in computer vision: A survey","volume":"31","author":"Murphy-Chutorian","year":"2008","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"10","key":"10.1016\/j.image.2021.116479_b79","doi-asserted-by":"crossref","first-page":"639","DOI":"10.1016\/0262-8856(94)90039-6","article-title":"Determining the gaze of faces in images","volume":"12","author":"Gee","year":"1994","journal-title":"Image Vis. Comput."},{"key":"10.1016\/j.image.2021.116479_b80","series-title":"2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017)","first-page":"17","article-title":"An all-in-one convolutional neural network for face analysis","author":"Ranjan","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b81","series-title":"2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017)","first-page":"258","article-title":"KEPLER: keypoint and pose estimation of unconstrained faces by learning efficient H-CNN regressors","author":"Kumar","year":"2017"},{"issue":"2","key":"10.1016\/j.image.2021.116479_b82","doi-asserted-by":"crossref","first-page":"802","DOI":"10.1109\/TIP.2011.2162740","article-title":"Combining head pose and eye location information for gaze estimation","volume":"21","author":"Valenti","year":"2011","journal-title":"IEEE Trans. Image Process."},{"key":"10.1016\/j.image.2021.116479_b83","series-title":"2011 IEEE International Conference on Computer Vision Workshops (ICCV Workshops)","first-page":"1713","article-title":"Appearance-based head pose estimation with scene-specific adaptation","author":"Chamveha","year":"2011"},{"issue":"1","key":"10.1016\/j.image.2021.116479_b84","doi-asserted-by":"crossref","first-page":"16","DOI":"10.1109\/TSMCB.2008.927274","article-title":"Recognizing visual focus of attention from head pose in natural meetings","volume":"39","author":"Ba","year":"2008","journal-title":"IEEE Trans. Syst. Man Cybern. B"},{"issue":"1","key":"10.1016\/j.image.2021.116479_b85","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1007\/s11760-012-0421-2","article-title":"3D head pose estimation and camera mouse implementation using a monocular video camera","volume":"9","author":"Nabati","year":"2015","journal-title":"Signal Imag. Video Process."},{"issue":"5500","key":"10.1016\/j.image.2021.116479_b86","doi-asserted-by":"crossref","first-page":"2268","DOI":"10.1126\/science.290.5500.2268","article-title":"The manifold ways of perception","volume":"290","author":"Seung","year":"2000","journal-title":"Science"},{"key":"10.1016\/j.image.2021.116479_b87","series-title":"2007 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"1","article-title":"Biased manifold embedding: A framework for person-independent head pose estimation","author":"Balasubramanian","year":"2007"},{"key":"10.1016\/j.image.2021.116479_b88","series-title":"European Conference on Computer Vision","first-page":"518","article-title":"Robust head pose estimation using supervised manifold learning","author":"BenAbdelkader","year":"2010"},{"key":"10.1016\/j.image.2021.116479_b89","series-title":"CVPR 2011","first-page":"2921","article-title":"Supervised local subspace learning for continuous head pose estimation","author":"Huang","year":"2011"},{"key":"10.1016\/j.image.2021.116479_b90","series-title":"2010 IEEE International Conference on Image Processing","first-page":"3277","article-title":"Multi-manifold modeling for head pose estimation","author":"Liu","year":"2010"},{"key":"10.1016\/j.image.2021.116479_b91","series-title":"Proceedings Fourth IEEE International Conference on Automatic Face and Gesture Recognition (Cat. No. PR00580)","first-page":"300","article-title":"Support vector regression and classification based multi-view face detection and recognition","author":"Li","year":"2000"},{"issue":"5","key":"10.1016\/j.image.2021.116479_b92","doi-asserted-by":"crossref","first-page":"413","DOI":"10.1016\/j.imavis.2003.12.005","article-title":"Support vector machine based multi-view face detection and recognition","volume":"22","author":"Li","year":"2004","journal-title":"Image Vis. Comput."},{"key":"10.1016\/j.image.2021.116479_b93","series-title":"2007 IEEE Intelligent Transportation Systems Conference","first-page":"709","article-title":"Head pose estimation for driver assistance systems: A robust algorithm and experimental evaluation","author":"Murphy-Chutorian","year":"2007"},{"key":"10.1016\/j.image.2021.116479_b94","series-title":"18th International Conference on Pattern Recognition (ICPR\u201906)","first-page":"507","article-title":"Sparse bayesian regression for head pose estimation","volume":"Vol. 3","author":"Ma","year":"2006"},{"key":"10.1016\/j.image.2021.116479_b95","series-title":"2004 International Conference on Image Processing, 2004. ICIP\u201904","first-page":"75","article-title":"Estimating facial pose from a sparse representation [face recognition applications]","volume":"Vol. 1","author":"Moon","year":"2004"},{"key":"10.1016\/j.image.2021.116479_b96","series-title":"Neural Networks for Pattern Recognition","author":"Bishop","year":"1995"},{"key":"10.1016\/j.image.2021.116479_b97","series-title":"Pattern Classification","author":"Duda","year":"2001"},{"key":"10.1016\/j.image.2021.116479_b98","series-title":"Workshop on Motion and Video Computing, 2002. Proceedings","first-page":"125","article-title":"Comparative study of coarse head pose estimation","author":"Brown","year":"2002"},{"key":"10.1016\/j.image.2021.116479_b99","series-title":"International Workshop on Automatic Face-and Gesture-Recognition","article-title":"Gaze tracking based on face-color","volume":"Vol. 476","author":"Schiele","year":"1995"},{"key":"10.1016\/j.image.2021.116479_b100","series-title":"Proceedings. International Conference on Image Processing","first-page":"I","article-title":"Real-time head orientation estimation using neural networks","volume":"Vol. 1","author":"Zhao","year":"2002"},{"key":"10.1016\/j.image.2021.116479_b101","series-title":"2007 IEEE International Conference on Multimedia and Expo","first-page":"1810","article-title":"Query driven localized linear discriminant models for head pose estimation","author":"Li","year":"2007"},{"key":"10.1016\/j.image.2021.116479_b102","series-title":"Proceedings.(ICASSP\u201905). IEEE International Conference on Acoustics, Speech, and Signal Processing, 2005","first-page":"ii","article-title":"A methodology for evaluating robustness of face recognition algorithms with respect to variations in pose angle and illumination angle","volume":"Vol. 2","author":"Little","year":"2005"},{"issue":"7","key":"10.1016\/j.image.2021.116479_b103","doi-asserted-by":"crossref","first-page":"743","DOI":"10.1109\/34.598231","article-title":"Automatic interpretation and coding of face images using flexible models","volume":"19","author":"Lanitis","year":"1997","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.image.2021.116479_b104","first-page":"2278","article-title":"Gradient-based learning applied to document recognition","volume":"86","author":"LeCun","year":"1998"},{"key":"10.1016\/j.image.2021.116479_b105","series-title":"Proceedings Eighth IEEE International Conference on Computer Vision. ICCV 2001","first-page":"674","article-title":"Kernel machine based learning for multi-view face detection and pose estimation","volume":"Vol. 2","author":"Li","year":"2001"},{"issue":"2","key":"10.1016\/j.image.2021.116479_b106","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","article-title":"Distinctive image features from scale-invariant keypoints","volume":"60","author":"Lowe","year":"2004","journal-title":"Int. J. Comput. Vis."},{"key":"10.1016\/j.image.2021.116479_b107","series-title":"18th International Conference on Pattern Recognition (ICPR\u201906)","first-page":"512","article-title":"Robust head pose estimation using LGBP","volume":"Vol. 2","author":"Ma","year":"2006"},{"key":"10.1016\/j.image.2021.116479_b108","series-title":"Proceedings of IEEE Computer Society Conference on Computer Vision and Pattern Recognition","first-page":"144","article-title":"Parametrized structure from motion for 3D adaptive feedback tracking of faces","author":"Jebara","year":"1997"},{"key":"10.1016\/j.image.2021.116479_b109","series-title":"Proceedings Fourth IEEE International Conference on Automatic Face and Gesture Recognition (Cat. No. PR00580)","first-page":"169","article-title":"A robust model-based approach for 3d head tracking in video sequences","author":"Malciu","year":"2000"},{"issue":"2","key":"10.1016\/j.image.2021.116479_b110","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1023\/B:VISI.0000029666.37597.d3","article-title":"Active appearance models revisited","volume":"60","author":"Matthews","year":"2004","journal-title":"Int. J. Comput. Vis."},{"key":"10.1016\/j.image.2021.116479_b111","doi-asserted-by":"crossref","unstructured":"G.P. Meyer, S. Gupta, I. Frosio, D. Reddy, J. Kautz, Robust model-based 3d head pose estimation, in: Proceedings of the IEEE International Conference on Computer Vision, 2015, pp. 3649\u20133657.","DOI":"10.1109\/ICCV.2015.416"},{"key":"10.1016\/j.image.2021.116479_b112","series-title":"2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017)","first-page":"711","article-title":"Robust and accurate 3d head pose estimation through 3dmm and online head model reconstruction","author":"Yu","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b113","series-title":"Proceedings of the 2nd Workshop on Computational Models of Social Interactions: Human-Computer-Media Communication","first-page":"25","article-title":"Highly accurate and fully automatic head pose estimation from a low quality consumer-level rgb-d sensor","author":"Ghiass","year":"2015"},{"key":"10.1016\/j.image.2021.116479_b114","doi-asserted-by":"crossref","unstructured":"C. Papazov, T.K. Marks, M. Jones, Real-time 3D head pose and facial landmark estimation from depth images using triangular surface patch features, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2015, pp. 4722\u20134730.","DOI":"10.1109\/CVPR.2015.7299104"},{"key":"10.1016\/j.image.2021.116479_b115","series-title":"Robust 3d head tracking by view-based feature point registration","author":"Jang","year":"2010"},{"issue":"2\u20134","key":"10.1016\/j.image.2021.116479_b116","doi-asserted-by":"crossref","first-page":"158","DOI":"10.1007\/s11263-017-0988-8","article-title":"Real-time accurate 3D head tracking and pose estimation with consumer rgb-d cameras","volume":"126","author":"Tan","year":"2018","journal-title":"Int. J. Comput. Vis."},{"issue":"12","key":"10.1016\/j.image.2021.116479_b117","doi-asserted-by":"crossref","first-page":"2444","DOI":"10.1109\/TPAMI.2016.2522441","article-title":"Joint head pose\/soft label estimation for human recognition in-the-wild","volume":"38","author":"Proenca","year":"2016","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.image.2021.116479_b118","series-title":"2008 8th IEEE International Conference on Automatic Face & Gesture Recognition","first-page":"1","article-title":"Generalized adaptive view-based appearance model: Integrated framework for monocular head pose estimation","author":"Morency","year":"2008"},{"key":"10.1016\/j.image.2021.116479_b119","series-title":"2012 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"2610","article-title":"3D constrained local model for rigid and non-rigid facial tracking","author":"Baltru\u0161aitis","year":"2012"},{"key":"10.1016\/j.image.2021.116479_b120","series-title":"2015 IEEE International Conference on Image Processing (ICIP)","first-page":"4624","article-title":"Head pose estimation via probabilistic high-dimensional regression","author":"Drouard","year":"2015"},{"key":"10.1016\/j.image.2021.116479_b121","series-title":"Proceedings. Fourteenth International Conference on Pattern Recognition (Cat. No. 98EX170)","first-page":"154","article-title":"Face pose discrimination using support vector machines (SVM)","volume":"Vol. 1","author":"Huang","year":"1998"},{"key":"10.1016\/j.image.2021.116479_b122","series-title":"International Evaluation Workshop on Classification of Events, Activities and Relationships","first-page":"299","article-title":"Head pose estimation in seminar room using multi view face detectors","author":"Zhang","year":"2006"},{"issue":"2","key":"10.1016\/j.image.2021.116479_b123","doi-asserted-by":"crossref","first-page":"77","DOI":"10.1109\/MSP.2011.942737","article-title":"Modeling dynamical influence in human interaction: Using data to make better inferences about influence within social systems","volume":"29","author":"Pan","year":"2012","journal-title":"IEEE Signal Process. Mag."},{"key":"10.1016\/j.image.2021.116479_b124","doi-asserted-by":"crossref","DOI":"10.1016\/j.dib.2019.103881","article-title":"FASSEG: A face semantic segmentation repository for face image analysis","volume":"24","author":"Benini","year":"2019","journal-title":"Data Brief"},{"issue":"1","key":"10.1016\/j.image.2021.116479_b125","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1109\/TPAMI.2017.2781233","article-title":"Hyperface: A deep multi-task learning framework for face detection, landmark localization, pose estimation, and gender recognition","volume":"41","author":"Ranjan","year":"2017","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.image.2021.116479_b126","series-title":"2018 13th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2018)","first-page":"59","article-title":"Openface 2.0: Facial behavior analysis toolkit","author":"Baltrusaitis","year":"2018"},{"key":"10.1016\/j.image.2021.116479_b127","doi-asserted-by":"crossref","unstructured":"N. Ruiz, E. Chong, J.M. Rehg, Fine-grained head pose estimation without keypoints, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, 2018, pp. 2074\u20132083.","DOI":"10.1109\/CVPRW.2018.00281"},{"issue":"4","key":"10.1016\/j.image.2021.116479_b128","doi-asserted-by":"crossref","first-page":"1035","DOI":"10.1109\/TMM.2018.2866770","article-title":"Quatnet: Quaternion-based head pose estimation with multiregression loss","volume":"21","author":"Hsu","year":"2018","journal-title":"IEEE Trans. Multimed."},{"key":"10.1016\/j.image.2021.116479_b129","series-title":"IT Convergence and Security 2017","first-page":"164","article-title":"Head pose estimation using convolutional neural network","author":"Lee","year":"2018"},{"key":"10.1016\/j.image.2021.116479_b130","doi-asserted-by":"crossref","first-page":"132","DOI":"10.1016\/j.patcog.2017.06.009","article-title":"Head pose estimation in the wild using convolutional neural networks and adaptive gradient methods","volume":"71","author":"Patacchiola","year":"2017","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.image.2021.116479_b131","doi-asserted-by":"crossref","unstructured":"F. Kuhnke, J. Ostermann, Deep head pose estimation using synthetic images and partial adversarial domain adaption for continuous label spaces, in: Proceedings of the IEEE International Conference on Computer Vision, 2019, pp. 10164\u201310173.","DOI":"10.1109\/ICCV.2019.01026"},{"issue":"7","key":"10.1016\/j.image.2021.116479_b132","doi-asserted-by":"crossref","first-page":"3952","DOI":"10.1109\/TII.2018.2884211","article-title":"Multimodal face-pose estimation with multitask manifold deep learning","volume":"15","author":"Hong","year":"2018","journal-title":"IEEE Trans. Ind. Inf."},{"key":"10.1016\/j.image.2021.116479_b133","series-title":"2009 Sixth IEEE International Conference on Advanced Video and Signal Based Surveillance","first-page":"296","article-title":"A 3D face model for pose and illumination invariant face recognition","author":"Paysan","year":"2009"},{"key":"10.1016\/j.image.2021.116479_b134","series-title":"ICPR International Workshop on Visual Observation of Deictic Gestures","article-title":"Estimating face orientation from robust detection of salient facial features","author":"Gourier","year":"2004"},{"key":"10.1016\/j.image.2021.116479_b135","doi-asserted-by":"crossref","first-page":"42458","DOI":"10.1109\/ACCESS.2020.2977346","article-title":"An end-to-end task-simplified and anchor-guided deep learning framework for image-based head pose estimation","volume":"8","author":"Li","year":"2020","journal-title":"IEEE Access"},{"key":"10.1016\/j.image.2021.116479_b136","series-title":"ICASSP 2020-2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","first-page":"1883","article-title":"Leveraging ordinal regression with soft labels for 3d head pose estimation from point sets","author":"Xiao","year":"2020"},{"key":"10.1016\/j.image.2021.116479_b137","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2020.107316","article-title":"Single image-based head pose estimation with spherical parametrization and 3D morphing","author":"Yuan","year":"2020","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.image.2021.116479_b138","doi-asserted-by":"crossref","unstructured":"T.-Y. Yang, Y.-T. Chen, Y.-Y. Lin, Y.-Y. Chuang, FSA-net: learning fine-grained structure aggregation for head pose estimation from a single image, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2019, pp. 1087\u20131096.","DOI":"10.1109\/CVPR.2019.00118"},{"key":"10.1016\/j.image.2021.116479_b139","series-title":"ICASSP 2019-2019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","first-page":"1977","article-title":"Nose, eyes and ears: Head pose estimation by locating facial keypoints","author":"Gupta","year":"2019"},{"key":"10.1016\/j.image.2021.116479_b140","series-title":"VISIGRAPP (5: VISAPP)","first-page":"123","article-title":"Combined framework for real-time head pose estimation using facial landmark detection and salient feature tracking","author":"Barros","year":"2018"},{"key":"10.1016\/j.image.2021.116479_b141","series-title":"VISIGRAPP (5: VISAPP)","first-page":"123","article-title":"Combined framework for real-time head pose estimation using facial landmark detection and salient feature tracking","author":"Barros","year":"2018"},{"key":"10.1016\/j.image.2021.116479_b142","series-title":"Proceedings of the 2nd Workshop on Computational Models of Social Interactions: Human-Computer-Media Communication","first-page":"25","article-title":"Highly accurate and fully automatic head pose estimation from a low quality consumer-level rgb-d sensor","author":"Ghiass","year":"2015"},{"key":"10.1016\/j.image.2021.116479_b143","series-title":"2018 IEEE Winter Conference on Applications of Computer Vision (WACV)","first-page":"75","article-title":"3D head pose estimation enhanced through SURF-based key-frames","author":"Madrigal","year":"2018"},{"key":"10.1016\/j.image.2021.116479_b144","series-title":"2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017)","first-page":"820","article-title":"Head pose estimation based on 3-D facial landmarks localization and regression","author":"Derkach","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b145","series-title":"2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017)","first-page":"642","article-title":"Joint head pose estimation and face alignment framework using global and local CNN features","author":"Xu","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b146","series-title":"2017 IEEE International Conference on Image Processing (ICIP)","first-page":"121","article-title":"Real-time monocular 6-DoF head pose estimation from salient 2D points","author":"Barros","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b147","series-title":"2016 IEEE International Conference on Image Processing (ICIP)","first-page":"1289","article-title":"3D head pose estimation with convolutional neural network trained on synthetic images","author":"Liu","year":"2016"},{"key":"10.1016\/j.image.2021.116479_b148","series-title":"Face alignment assisted by head pose estimation","author":"Yang","year":"2015"},{"issue":"8","key":"10.1016\/j.image.2021.116479_b149","doi-asserted-by":"crossref","first-page":"1871","DOI":"10.1007\/s11760-014-0676-x","article-title":"Head pose estimation based on face symmetry analysis","volume":"9","author":"Dahmane","year":"2015","journal-title":"Signal Imag. Video Process."},{"key":"10.1016\/j.image.2021.116479_b150","series-title":"2015 11th IEEE International Conference and Workshops on Automatic Face and Gesture Recognition (FG)","first-page":"1","article-title":"Automatic 3d facial expression recognition using geometric scattering representation","volume":"Vol. 1","author":"Yang","year":"2015"},{"key":"10.1016\/j.image.2021.116479_b151","series-title":"CVPR 2011","first-page":"617","article-title":"Real time head pose estimation with random regression forests","author":"Fanelli","year":"2011"},{"issue":"12","key":"10.1016\/j.image.2021.116479_b152","doi-asserted-by":"crossref","first-page":"2234","DOI":"10.1109\/TPAMI.2007.70733","article-title":"Automatic age estimation based on facial aging patterns","volume":"29","author":"Geng","year":"2007","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.image.2021.116479_b153","series-title":"2014 2nd International Conference on 3D Vision","first-page":"641","article-title":"Real time head model creation and head pose estimation on consumer depth cameras","volume":"Vol. 1","author":"Martin","year":"2014"},{"key":"10.1016\/j.image.2021.116479_b154","series-title":"Scandinavian Conference on Image Analysis","first-page":"319","article-title":"Head pose estimation using multi-scale gaussian derivatives","author":"Jain","year":"2013"},{"key":"10.1016\/j.image.2021.116479_b155","series-title":"VISAPP (2)","first-page":"223","article-title":"3D face pose tracking using low quality depth cameras","author":"Rekik","year":"2013"},{"key":"10.1016\/j.image.2021.116479_b156","series-title":"2012 IEEE Computer Society Conference on Computer Vision and Pattern Recognition Workshops","first-page":"42","article-title":"Head pose estimation on depth data based on particle swarm optimization","author":"Padeleris","year":"2012"},{"key":"10.1016\/j.image.2021.116479_b157","series-title":"CVPR 2011","first-page":"617","article-title":"Real time head pose estimation with random regression forests","author":"Fanelli","year":"2011"},{"key":"10.1016\/j.image.2021.116479_b158","series-title":"2011 18th IEEE International Conference on Image Processing","first-page":"3617","article-title":"Robust head pose estimation via convex regularized sparse regression","author":"Ji","year":"2011"},{"key":"10.1016\/j.image.2021.116479_b159","series-title":"Proceedings of the Seventh Indian Conference on Computer Vision, Graphics and Image Processing","first-page":"162","article-title":"A robust head pose estimation system for uncalibrated monocular videos","author":"Prasad","year":"2010"},{"key":"10.1016\/j.image.2021.116479_b160","series-title":"2010 IEEE International Conference on Image Processing","first-page":"3277","article-title":"Multi-manifold modeling for head pose estimation","author":"Liu","year":"2010"},{"key":"10.1016\/j.image.2021.116479_b161","series-title":"2017 IEEE International Conference on Multimedia and Expo (ICME)","first-page":"175","article-title":"Head pose estimation through multi-class face segmentation","author":"Khan","year":"2017"},{"key":"10.1016\/j.image.2021.116479_b162","doi-asserted-by":"crossref","first-page":"97","DOI":"10.1016\/j.neucom.2014.06.014","article-title":"CovGa: A novel descriptor based on symmetry of regions for head pose estimation","volume":"143","author":"Ma","year":"2014","journal-title":"Neurocomputing"},{"key":"10.1016\/j.image.2021.116479_b163","doi-asserted-by":"crossref","unstructured":"V. Kazemi, J. Sullivan, One millisecond face alignment with an ensemble of regression trees, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2014, pp. 1867\u20131874.","DOI":"10.1109\/CVPR.2014.241"},{"key":"10.1016\/j.image.2021.116479_b164","doi-asserted-by":"crossref","unstructured":"A. Bulat, G. Tzimiropoulos, How far are we from solving the 2d & 3d face alignment problem?(and a dataset of 230,000 3d facial landmarks), in: Proceedings of the IEEE International Conference on Computer Vision, 2017, pp. 1021\u20131030.","DOI":"10.1109\/ICCV.2017.116"},{"key":"10.1016\/j.image.2021.116479_b165","series-title":"2016 IEEE Winter Conference on Applications of Computer Vision (WACV)","first-page":"1","article-title":"Openface: an open source facial behavior analysis toolkit","author":"Baltru\u0161aitis","year":"2016"},{"issue":"2","key":"10.1016\/j.image.2021.116479_b166","doi-asserted-by":"crossref","first-page":"200","DOI":"10.1007\/s11263-010-0380-4","article-title":"Deformable model fitting by regularized landmark mean-shift","volume":"91","author":"Saragih","year":"2011","journal-title":"Int. J. Comput. Vis."},{"key":"10.1016\/j.image.2021.116479_b167","doi-asserted-by":"crossref","first-page":"13","DOI":"10.1016\/j.imavis.2016.05.009","article-title":"Dense 3d face alignment from 2d video for real-time use","volume":"58","author":"Jeni","year":"2017","journal-title":"Image Vis. Comput."},{"issue":"4","key":"10.1016\/j.image.2021.116479_b168","doi-asserted-by":"crossref","first-page":"2014","DOI":"10.1109\/TITS.2015.2396031","article-title":"Driver gaze tracking and eyes off the road detection system","volume":"16","author":"Vicente","year":"2015","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"10.1016\/j.image.2021.116479_b169","doi-asserted-by":"crossref","unstructured":"Y. Wu, C. Gou, Q. Ji, Simultaneous facial landmark detection, pose and deformation estimation under facial occlusion, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2017, pp. 3471\u20133480.","DOI":"10.1109\/CVPR.2017.606"},{"key":"10.1016\/j.image.2021.116479_b170","doi-asserted-by":"crossref","unstructured":"A. Asthana, S. Zafeiriou, S. Cheng, M. Pantic, Incremental face alignment in the wild, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2014, pp. 1859\u20131866.","DOI":"10.1109\/CVPR.2014.240"},{"issue":"2","key":"10.1016\/j.image.2021.116479_b171","doi-asserted-by":"crossref","first-page":"178","DOI":"10.1007\/s11263-008-0185-x","article-title":"Pose-invariant facial expression recognition using variable-intensity templates","volume":"83","author":"Kumano","year":"2009","journal-title":"Int. J. Comput. Vis."},{"key":"10.1016\/j.image.2021.116479_b172","series-title":"IJCAI","first-page":"7","article-title":"SSR-net: A compact soft stagewise regression network for age estimation","volume":"Vol. 5","author":"Yang","year":"2018"},{"issue":"6","key":"10.1016\/j.image.2021.116479_b173","doi-asserted-by":"crossref","first-page":"681","DOI":"10.1109\/34.927467","article-title":"Active appearance models","author":"Cootes","year":"2001","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"8","key":"10.1016\/j.image.2021.116479_b174","doi-asserted-by":"crossref","first-page":"1871","DOI":"10.1007\/s11760-014-0676-x","article-title":"Head pose estimation based on face symmetry analysis","volume":"9","author":"Dahmane","year":"2015","journal-title":"Signal Imag. Video Process."},{"issue":"4","key":"10.1016\/j.image.2021.116479_b175","doi-asserted-by":"crossref","first-page":"607","DOI":"10.1109\/TPAMI.2008.106","article-title":"Head pose estimation in computer vision: A survey","volume":"31","author":"Murphy-Chutorian","year":"2008","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"2","key":"10.1016\/j.image.2021.116479_b176","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1109\/72.661121","article-title":"Recognition of human head orientation based on artificial neural networks","volume":"9","author":"Rae","year":"1998","journal-title":"IEEE Trans. Neural Netw."},{"key":"10.1016\/j.image.2021.116479_b177","series-title":"Proceedings International Workshop on Recognition, Analysis, and Tracking of Faces and Gestures in Real-Time Systems. in Conjunction with ICCV\u201999 (Cat. No. PR00378)","first-page":"14","article-title":"Multi-view face detection and pose estimation using a composite support vector machine across the view sphere","author":"Ng","year":"1999"},{"key":"10.1016\/j.image.2021.116479_b178","first-page":"I","article-title":"Adaptive view-based appearance models","volume":"Vol. 1","author":"Morency","year":"2003"},{"issue":"18","key":"10.1016\/j.image.2021.116479_b179","doi-asserted-by":"crossref","first-page":"4831","DOI":"10.1080\/01431160802672864","article-title":"Effect of errors in ground truth on classification accuracy","volume":"30","author":"Carlotto","year":"2009","journal-title":"Int. J. Remote Sens."},{"issue":"1","key":"10.1016\/j.image.2021.116479_b180","doi-asserted-by":"crossref","first-page":"44","DOI":"10.1093\/nsr\/nwx106","article-title":"A brief introduction to weakly supervised learning","volume":"5","author":"Zhou","year":"2018","journal-title":"Nat. Sci. Rev."},{"key":"10.1016\/j.image.2021.116479_b181","unstructured":"Y.-H. Hubert\u00a0Tsai, Y.-R. Yeh, Y.-C. Frank\u00a0Wang, Learning cross-domain landmarks for heterogeneous domain adaptation, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2016, pp. 5081\u20135090."},{"issue":"1\u20132","key":"10.1016\/j.image.2021.116479_b182","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1007\/s11263-014-0719-3","article-title":"Asymmetric and category invariant feature transformations for domain adaptation","volume":"109","author":"Hoffman","year":"2014","journal-title":"Int. J. Comput. Vis."},{"key":"10.1016\/j.image.2021.116479_b183","series-title":"Towards good practices for very deep two-stream convnets","author":"Wang","year":"2015"},{"key":"10.1016\/j.image.2021.116479_b184","doi-asserted-by":"crossref","unstructured":"A. Karpathy, G. Toderici, S. Shetty, T. Leung, R. Sukthankar, L. Fei-Fei, Large-scale video classification with convolutional neural networks, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2014, pp. 1725\u20131732.","DOI":"10.1109\/CVPR.2014.223"}],"container-title":["Signal Processing: Image Communication"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0923596521002332?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0923596521002332?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2023,3,5]],"date-time":"2023-03-05T19:27:13Z","timestamp":1678044433000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0923596521002332"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,11]]},"references-count":184,"alternative-id":["S0923596521002332"],"URL":"https:\/\/doi.org\/10.1016\/j.image.2021.116479","relation":{},"ISSN":["0923-5965"],"issn-type":[{"value":"0923-5965","type":"print"}],"subject":[],"published":{"date-parts":[[2021,11]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Head pose estimation: A survey of the last ten years","name":"articletitle","label":"Article Title"},{"value":"Signal Processing: Image Communication","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.image.2021.116479","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2021 Elsevier B.V. All rights reserved.","name":"copyright","label":"Copyright"}],"article-number":"116479"}}