@inproceedings{60211395b232406f85e37dfe9a071f55,
  author    = {Chiu, {Tzu Hsuan} and Chiang, {Chen Yu} and Liao, {Yuan Fu} and Yang, {Jyh Her} and Wang, Yih-Ru and Chen, Sin-Horng},
  title     = {Prosody-dependent acoustic modeling for {Mandarin} speech recognition},
  booktitle = {Proceedings of the 6th International Conference on Speech Prosody, SP 2012},
  publisher = {Tongji University Press},
  address   = {China},
  year      = {2012},
  month     = jan,
  day       = {1},
  pages     = {139--142},
  isbn      = {9787560848693},
  language  = {English},
  keywords  = {Acoustic modeling, Prosodic break, Prosody-dependent acoustic model, Speech recognition},
  abstract  = {A study on introducing prosodic information to acoustic modeling (AM) for speech recognition is reported in this paper. It extends the conventional context-dependent (CD) triphone HMM modeling approach to further consider the dependency of phone model on the break type of nearby inter-syllable boundary. Four break types are considered, including major break, minor break, normal non-break, and tightly-coupled non-break. In the training phase, break labeling is automatically accomplished by a Prosody Labeling and Modeling algorithm proposed previously. Then, prosody- and phonetic-dependent phone models are constructed by a standard decision tree-based context clustering of HMMs. The effectiveness of the new AM was examined on a Mandarin syllable recognition task. Experimental results showed that the new approach outperformed the conventional CD-AM on achieving better syllable recognition rate as well as on obtaining a more efficient syllable lattice with better compromise on complexity versus syllable coverage rate.},
  note      = {Conference date: 22-05-2012 Through 25-05-2012},
}