% Conference paper (ICASSP 2010) exported from an institutional repository.
% The citation key is the repository OAI identifier and is kept as-is so
% existing citations keep resolving.
% Fields not known to standard styles (abstract, format, author_native, yomi)
% are ignored when typesetting and only carry repository metadata.
% author_native holds the native-script form of the second author's name;
% it is kept out of the author list so that person is not counted twice
% (presumably the same person, judging by the yomi reading -- confirm).
@inproceedings{oai:nitech.repo.nii.ac.jp:00003410,
  author        = {Kazumi, Kyousuke and Nankaku, Yoshihiko and Tokuda, Keiichi},
  title         = {Factor Analyzed Voice Models for {HMM}-Based Speech Synthesis},
  booktitle     = {{ICASSP} 2010. {IEEE} International Conference on Acoustics, Speech and Signal Processing},
  pages         = {4234--4237},
  publisher     = {Institute of Electrical and Electronics Engineers},
  year          = {2010},
  month         = mar,
  note          = {14--19 March 2010, Dallas, TX, USA},
  abstract      = {This paper describes factor analyzed voice models for realizing various voice characteristics in the HMM-based speech synthesis. The eigenvoice method can synthesize speech with arbitrary voice characteristics by interpolating representative HMM sets. However, the objective of PCA is to accurately reconstruct each speaker-dependent HMM set, and this is not equivalent to estimating models which represent training data accurately. To overcome this problem, we propose a general speech model which generates speech utterances with various voice characteristics directly. In the proposed method, the HMM states, factors representing voice characteristics and contextual decision trees are simultaneously optimized within a unified framework.},
  format        = {application/pdf},
  author_native = {南角, 吉彦},
  yomi          = {ナンカク, ヨシヒコ},
}