@inproceedings{a46b41b11414495bbfa87acd0318a255,
title = "Maximising audiovisual correlation with automatic lip tracking and vowel based segmentation",
abstract = "In recent years, the established link between the various human communication production domains has become more widely utilised in the field of speech processing. In this work, a state of the art Semi Adaptive Appearance Model (SAAM) approach developed by the authors is used for automatic lip tracking, and an adapted version of our vowel based speech segmentation system is employed to automatically segment speech. Canonical Correlation Analysis (CCA) on segmented and non segmented data in a range of noisy speech environments finds that segmented speech has a significantly better audiovisual correlation, demonstrating the feasibility of our techniques for further development as part of a proposed audiovisual speech enhancement system.",
keywords = "canonical correlation, canonical correlation analysis, noisy environment, speech enhancement, visual speech",
author = "Andrew Abel and Amir Hussain and Nguyen, {Quoc Dinh} and Fabien Ringeval and Mohamed Chetouani and Maurice Milgram",
year = "2009",
month = sep,
day = "7",
doi = "10.1007/978-3-642-04391-8_9",
language = "English",
isbn = "3642043909",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer",
pages = "65--72",
editor = "Julian Fierrez and Javier Ortega-Garcia and Anna Esposito and Andrzej Drygajlo and Marcos Faundez-Zanuy",
booktitle = "Biometric ID Management and Multimodal Communication",
note = "Joint COST 2101 and 2102 International Conference on Biometric ID Management and Multimodal Communication, BioID_MultiComm 2009 ; Conference date: 16-09-2009 Through 18-09-2009",
}