@inbook{172cebf1c3634a4d9ab6a9ec282d7ba9,
title = "Synergistic Face Detection and Pose Estimation with Energy-Based Models",
abstract = "We describe a novel method for real-time, simultaneous multi-view face detection and facial pose estimation. The method employs a convolutional network to map face images to points on a manifold, parametrized by pose, and non-face images to points far from that manifold. This network is trained by optimizing a loss function of three variables: image, pose, and face/non-face label. We test the resulting system, in a single configuration, on three standard data sets – one for frontal pose, one for rotated faces, and one for profiles – and find that its performance on each set is comparable to previous multi-view face detectors that can only handle one form of pose variation. We also show experimentally that the system{\textquoteright}s accuracy on both face detection and pose estimation is improved by training for the two tasks together.",
author = "Margarita Osadchy and \{Le Cun\}, Yann and Miller, \{Matthew L.\}",
year = "2006",
doi = "10.1007/11957959\_10",
language = "English",
isbn = "978-3-540-68794-8",
series = "Lecture Notes in Computer Science",
publisher = "Springer Berlin Heidelberg",
pages = "196--206",
editor = "Jean Ponce and Martial Hebert and Cordelia Schmid and Andrew Zisserman",
booktitle = "Toward Category-Level Object Recognition",
}