% Workshop paper in the ICCV 2009 Workshops proceedings (see booktitle).
% Typed as a proceedings contribution so that styles print the venue.
% The citation key is kept verbatim so existing citations keep resolving.
@inproceedings{377c297573cf4dec8c924517564ca000,
  author    = {Daubney, Ben and Gibson, David and Campbell, Neill},
  title     = {Monocular {3D} human pose estimation using sparse motion features},
  booktitle = {2009 {IEEE} 12th International Conference on Computer Vision Workshops ({ICCV} Workshops)},
  publisher = {Institute of Electrical and Electronics Engineers},
  year      = {2009},
  month     = sep,
  pages     = {1050--1057},
  doi       = {10.1109/ICCVW.2009.5457586},
  isbn      = {978-1-4244-4442-7},
  language  = {English},
  keywords  = {Humans, Motion estimation, Tracking, Data mining, Motion detection, Detectors, Image sequences, Cameras, Robustness, Legged locomotion, pose estimation, feature extraction, human eva data set},
  abstract  = {In this paper we demonstrate that the motion of a sparse set of tracked features can be used to extract 3D pose from a single viewpoint. The purpose of this work is to illustrate the wealth of information present in the temporal dimension of a sequence of images that is currently not being exploited. Our approach is entirely dependent upon motion. We use low-level part detectors consisting of 3D motion models, these describe probabilistically how well the observed motion of a tracked feature fits each model. Given these initial detections a bottom-up approach is employed to find the most likely configuration of a person in each frame. Models used are learnt directly from motion capture data and no training is performed using descriptors derived from image sequences. The result is the presented approach can be applied to people moving at arbitrary and previously unseen orientations relative to the camera, making it particularly versatile and robust. We evaluate our approach for both walking and jogging on the HumanEva data set where we achieve an accuracy of 65.8 $\pm$ 23.3 mm and 69.4 $\pm$ 20.2 mm for each action respectively.},
}