% Conference paper on the RoHiLTA hierarchical lip tracking approach (2004).
% The citation key looks like an auto-generated export identifier; it is kept
% unchanged so that existing citations of this entry continue to resolve.
% Author names use the unambiguous "Last, First" form throughout.
@inproceedings{34e82fb5026f4dcd850c1c1b22108090,
  author    = {Xie, Lei and Cai, Xiu Li and Fu, Zhong Hua and Zhao, Rong Chun and Jiang, Dong Mei},
  title     = {A robust hierarchical lip tracking approach for lipreading and audio visual speech recognition},
  booktitle = {Proceedings of 2004 International Conference on Machine Learning and Cybernetics},
  year      = {2004},
  pages     = {3620--3624},
  isbn      = {0780384032},
  language  = {English},
  keywords  = {Active shape model, Audio visual speech recognition, Lip tracking, Lipreading},
  abstract  = {This paper presents a robust hierarchical lip tracking approach (RoHiLTA) for lipreading and audio visual speech recognition (AVSR) applications. Lip regions of interest are subtly detected by motion and facial structure information. Improvements are made on Active Shape Models (ASMs) for extracting lip contours more accurately and efficiently from video sequences of a speaker's talking face in natural lighting conditions and without particular make-ups. Local and global ASM search algorithms are both improved by introducing color information, 2D mouth corner match, and robust estimation. For noise-free features, localization errors are automatically corrected by an interpolating scheme. A fast implementation of the hierarchical approach is also proposed. Extensive experiments show that the improved ASM can effectively reduce the lip locating errors. The fast implementation of RoHiLTA can consistently achieve superior performance to conventional ASMs in lip tracking tasks, and then can be effectively integrated in lipreading and AVSR systems.},
  note      = {Proceedings of 2004 International Conference on Machine Learning and Cybernetics ; Conference date: 26-08-2004 Through 29-08-2004},
}