@conference {73, title = {The computer expression recognition toolbox (CERT)}, booktitle = {2011 IEEE International Conference on Automatic Face Gesture Recognition and Workshops (FG 2011)}, year = {2011}, month = {03/2011}, publisher = {IEEE}, organization = {IEEE}, address = {Santa Barbara, CA}, abstract = {

We present the Computer Expression Recognition Toolbox (CERT), a software tool for fully automatic real-time facial expression recognition, and officially release it for free academic use. CERT can automatically code the intensity of 19 different facial actions from the Facial Action Coding System (FACS) and 6 different prototypical facial expressions. It also estimates the locations of 10 facial features as well as the 3-D orientation (yaw, pitch, roll) of the head. On a database of posed facial expressions, the Extended Cohn-Kanade dataset (CK+ [1]), CERT achieves an average recognition performance (probability of correctness on a two-alternative forced choice (2AFC) task between one positive and one negative example) of 90.1\% when analyzing facial actions. On a spontaneous facial expression dataset, CERT achieves an accuracy of nearly 80\%. On a standard dual-core laptop, CERT can process 320 {\texttimes} 240 video images in real time at approximately 10 frames per second.

}, keywords = {3D orientation, Accuracy, automatic real-time facial expression recognition, CERT, computer expression recognition toolbox, Detectors, dual core laptop, Emotion recognition, Encoding, extended Cohn-Kanade, Face, face recognition, facial action unit coding system, facial expression dataset, Facial features, FACS, Gold, Image coding, software tool, software tools, two-alternative forced choice task}, isbn = {978-1-4244-9140-7}, author = {Littlewort, G. and Whitehill, J. and Wu, T. and Fasel, I. and Frank, M. and Movellan, J. and Bartlett, M.} } @article {69, title = {Toward Practical Smile Detection}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence}, volume = {31}, year = {2009}, month = {11/2009}, pages = {2106-2111}, chapter = {2106}, abstract = {

Machine learning approaches have produced some of the highest reported performances for facial expression recognition. However, to date, nearly all automatic facial expression recognition research has focused on optimizing performance on a few databases that were collected under controlled lighting conditions on a relatively small number of subjects. This paper explores whether current machine learning methods can be used to develop an expression recognition system that operates reliably in more realistic conditions. We explore the necessary characteristics of the training data set, image registration, feature representation, and machine learning algorithms. A new database, GENKI, is presented, which contains pictures, photographed by the subjects themselves, of thousands of different people in many different real-world imaging conditions. Results suggest that human-level expression recognition accuracy in real-life illumination conditions is achievable with machine learning technology. However, the data sets currently used in the automatic expression recognition literature to evaluate progress may be overly constrained and could potentially lead research into locally optimal algorithmic solutions.

}, keywords = {Algorithms, Artificial intelligence, Automated, automatic facial expression recognition research, Biological Pattern Recognition, Biometry, Computer simulation, Computer vision, Computer-Assisted, Face, Face and gesture recognition, face recognition, feature representation, human-level expression recognition accuracy, illumination conditions, Image databases, Image Enhancement, Image Interpretation, image registration, image representation, learning (artificial intelligence), machine learning approaches, Machine Learning Models, Humans, object detection, practical smile detection, Reproducibility of Results, Sensitivity and Specificity, Smiling, Subtraction Technique, training data set, visual databases}, issn = {0162-8828}, author = {Whitehill, J. and Littlewort, G. and Fasel, I. and Bartlett, M. and Movellan, J.} } @conference {59, title = {Building a more effective teaching robot using apprenticeship learning}, booktitle = {7th IEEE International Conference on Development and Learning, 2008. ICDL 2008}, year = {2008}, month = {08/2008}, publisher = {IEEE}, organization = {IEEE}, address = {Monterey, CA}, abstract = {

What defines good teaching? While attributes such as timing, responsiveness to social cues, and pacing of material clearly play a role, it is difficult to create a comprehensive specification of what it means to be a good teacher. On the other hand, it is relatively easy to obtain examples of expert teaching behavior by observing a real teacher. With this inspiration as our guide, we investigated apprenticeship learning methods [1] that use data recorded from expert teachers as a means of improving the teaching abilities of RUBI, a social robot immersed in a classroom of 18- to 24-month-old children. While this approach has achieved considerable success in mechanical control, such as automated helicopter flight [2], until now there has been little work on applying it to the field of social robotics. This paper explores two particular approaches to apprenticeship learning and analyzes the models of teaching that each approach learns from the data of the human teacher. Empirical results indicate that the apprenticeship learning paradigm, though still nascent in its use in the social robotics field, holds promise, and that our proposed methods can already extract meaningful teaching models from demonstrations of a human expert.

}, keywords = {apprenticeship learning, automated helicopter flight, Automatic control, Data mining, Delay, education, Educational robots, expert teaching, Helicopters, Human-robot interaction, humanoid robots, Humans, Learning systems, mechanical control, robot teaching, Robotics and Automation, RUBI social robot, time 18 month to 24 month, timing}, isbn = {978-1-4244-2661-4}, author = {Ruvolo, P. and Whitehill, J. and Virnes, M. and Movellan, J.} } @conference {62, title = {A discriminative approach to frame-by-frame head pose tracking}, booktitle = {8th IEEE International Conference on Automatic Face Gesture Recognition, 2008. FG {\textquoteright}08}, year = {2008}, month = {09/2008}, publisher = {IEEE}, organization = {IEEE}, address = {Amsterdam}, abstract = {

We present a discriminative approach to frame-by-frame head pose tracking that is robust to a wide range of illuminations and facial appearances and that is inherently immune to accuracy drift. Most previous research on head pose tracking has been validated on test datasets spanning only a small number (\< 20) of subjects under controlled illumination conditions on continuous video sequences. In contrast, the system presented in this paper was both trained and tested on a much larger database, GENKI, spanning tens of thousands of different subjects, illuminations, and geographical locations from images on the Web. Our pose estimator achieves root-mean-square (RMS) errors of 5.82{\textdegree}, 5.65{\textdegree}, and 2.96{\textdegree} for yaw, pitch, and roll, respectively. A set of 4000 images from this dataset, labeled for pose, was collected and released for use by the research community.

}, keywords = {accuracy drift, continuous video sequence, controlled illumination condition, discriminative approach, face detection, face recognition, facial appearance, frame-by-frame head pose tracking, Humans, Image analysis, Image databases, Laboratories, Lighting, Magnetic heads, mean square error methods, pose estimation, Robustness, root-mean-square error tracking, System testing, Video sequences}, isbn = {978-1-4244-2153-4}, author = {Whitehill, J. and Movellan, Javier R.} }