@Article{Brinckmann_Trouvain:2003,
AUTHOR = {Brinckmann, Caren and Trouvain, Jürgen},
TITLE = {The Role of Duration Models and Symbolic Representation for Timing in Synthetic Speech},
YEAR = {2003},
MONTH = {January},
JOURNAL = {International Journal of Speech Technology},
VOLUME = {6},
NUMBER = {1},
PAGES = {21-23},
URL = {http://dx.doi.org/10.1023/A:1021043804581},
ABSTRACT = {In order to determine priorities for the improvement of timing in synthetic speech this study looks at the role of segmental duration prediction and the role of phonological symbolic representation in the perceptual quality of a text-to-speech system. In perception experiments using German speech synthesis, two standard duration models (Klatt rules and CART) were tested. The input to these models consisted of a symbolic representation which was either derived from a database or a text-to-speech system. Results of the perception experiments show that different duration models can only be distinguished when the symbolic representation is appropriate. Considering the relative importance of the symbolic representation, post-lexical segmental rules were investigated with the outcome that listeners differ in their preferences regarding the degree of segmental reduction. As a conclusion, before fine-tuning the duration prediction, it is important to derive an appropriate phonological symbolic representation in order to improve timing in synthetic speech.} }
|