@inproceedings{acc6b2063ded46a0b0fefac556c6db2e,
title = "MTGLS: Multi-Task Gaze Estimation with Limited Supervision",
abstract = "Robust gaze estimation is a challenging task, even for deep CNNs, due to the non-availability of large-scale labeled data. Moreover, gaze annotation is a time-consuming process and requires specialized hardware setups. We propose MTGLS: a Multi-Task Gaze estimation framework with Limited Supervision, which leverages abundantly available non-annotated facial image data. MTGLS distills knowledge from off-the-shelf facial image analysis models, and learns strong feature representations of human eyes, guided by three complementary auxiliary signals: (a) the line of sight of the pupil (i.e. pseudo-gaze) defined by the localized facial landmarks, (b) the head-pose given by Euler angles, and (c) the orientation of the eye patch (left/right eye). To overcome inherent noise in the supervisory signals, MT-GLS further incorporates a noise distribution modelling approach. Our experimental results show that MTGLS learns highly generalized representations which consistently perform well on a range of datasets. Our proposed framework outperforms the unsupervised state-of-the-art on CAVE (by ∼ 6.43%) and even supervised state-of-the-art methods on Gaze360 (by ∼ 6.59%) datasets.",
keywords = "Biometrics, Face Processing Human-Computer Interaction, Few-shot, Large-scale Vision Applications, Semi- and Un- supervised Learning, Transfer",
author = "Shreya Ghosh and Munawar Hayat and Abhinav Dhall and Jarrod Knibbe",
year = "2022",
month = feb,
day = "15",
doi = "10.1109/WACV51458.2022.00123",
language = "English",
isbn = "978-1-6654-0916-2",
series = "IEEE Winter Conference on Applications of Computer Vision",
publisher = "Institute of Electrical and Electronics Engineers",
pages = "1161--1172",
booktitle = "Proceedings",
address = "United States",
note = "22nd IEEE/CVF Winter Conference on Applications of Computer Vision, WACV 2022 ; Conference date: 03-01-2022 Through 08-01-2022",
}