% Journal article entry (citation key ART001698053).
% Acronyms and proper nouns in the title are brace-protected so that styles
% which sentence-case titles keep their capitalisation.
@article{ART001698053,
  author  = {임기정 and Lee, Jungchul},
  title   = {Improvement of Naturalness for a {HMM}-based {Korean} {TTS} using the prosodic boundary information},
  journal = {Journal of The Korea Society of Computer and Information},
  issn    = {1598-849X},
  year    = {2012},
  volume  = {17},
  number  = {9},
  pages   = {75--84},
}
TY  - JOUR
AU  - 임기정
AU  - Lee, Jungchul
TI  - Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information
JO  - Journal of The Korea Society of Computer and Information
PY  - 2012
VL  - 17
IS  - 9
PB  - The Korean Society Of Computer And Information
SP  - 75
EP  - 84
SN  - 1598-849X
AB  - HMM-based Text-to-Speech systems generally utilize context dependent tri-phone units from a large corpus speech DB to enhance the synthetic speech. To downsize a large corpus speech DB, acoustically similar tri-phone units are clustered based on the decision tree using context dependent information. Context dependent information includes phoneme sequence as well as prosodic information because the naturalness of synthetic speech highly depends on the prosody such as pause, intonation pattern, and segmental duration. However, if the prosodic information was complicated, many context dependent phonemes would have no examples in the training data, and clustering would provide a smoothed feature which will generate unnatural synthetic speech. In this paper, instead of complicate prosodic information we propose a simple three prosodic boundary types and decision tree questions that use rising tone, falling tone, and monotonic tone to improve naturalness. Experimental results show that our proposed method can improve naturalness of a HMM-based Korean TTS and get high MOS in the perception test.
KW  - HTS
KW  - HMM
KW  - tri-phone
KW  - decision tree-based clustering
DO  - 
UR  - 
ER  - 
임기정 and Jungchul Lee. (2012). Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information. Journal of The Korea Society of Computer and Information, 17(9), 75-84.
임기정 and Jungchul Lee. 2012, "Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information", Journal of The Korea Society of Computer and Information, vol.17, no.9, pp.75-84.
임기정, Jungchul Lee "Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information" Journal of The Korea Society of Computer and Information 17.9 (2012) : 75-84.
임기정, Jungchul Lee. Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information. Journal of The Korea Society of Computer and Information. 2012; 17(9), 75-84.
임기정 and Jungchul Lee. "Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information" Journal of The Korea Society of Computer and Information 17, no.9 (2012) : 75-84.
임기정; Jungchul Lee. Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information. Journal of The Korea Society of Computer and Information, 2012, 17(9), 75-84.
임기정; Jungchul Lee. Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information. Journal of The Korea Society of Computer and Information. 2012; 17(9) 75-84.
임기정, Jungchul Lee. Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information. Journal of The Korea Society of Computer and Information. 2012; 17(9), 75-84.
임기정 and Jungchul Lee. "Improvement of Naturalness for a HMM-based Korean TTS using the prosodic boundary information" Journal of The Korea Society of Computer and Information 17, no.9 (2012) : 75-84.