% Conference paper in the ICMA 2012 proceedings (see booktitle).
% The citation key is kept exactly as-is so existing \cite commands keep resolving.
% No "series" field: the proceedings name belongs in booktitle only; repeating it
% as a series makes some styles print it twice.
% "day" and "language" are not used by the standard classic styles; they are
% retained as extra metadata.
@inproceedings{7d9413fd95ba4518b60de9195e22fe00,
  author    = {Hu, Jwu-Sheng and Lee, {Ming Tang} and Xiao, {Yun Xuan}},
  title     = {Wake-up-word detection by estimating formants from spatial eigenspace information},
  booktitle = {2012 {IEEE} International Conference on Mechatronics and Automation, {ICMA} 2012},
  year      = {2012},
  month     = oct,
  day       = {23},
  pages     = {2019--2024},
  doi       = {10.1109/ICMA.2012.6285132},
  isbn      = {9781467312776},
  language  = {English},
  note      = {Conference date: 05-08-2012 Through 08-08-2012},
  abstract  = {Wake-up-word (WUW) detection is to detect a single word or phrase while rejecting all other words or sounds. For distant human-robot interaction (HRI), the location of the target speaker and a unique command are required to activate the robot. In this paper, a multi-channel speech interface is introduced not only to estimate the unknown locations of the sound sources but also to strengthen the speech feature for WUW detection. A ring-shape microphone array is used to collect the speech signal. The spatial eigenspace information discovered by multiple signal classification (MUSIC) is used to estimate location dependent formants and the direction of the target speaker. The estimated formants contained in fixed time duration are grouped and evaluated using the likelihood functions of formants. A cascaded detector is also introduced to make the final decision. Experimental results demonstrate the usefulness of the proposed approach with several noisy conditions, including the cases of simultaneous competing speeches.},
}