% Chapter by Obin, Veaux and Lanchantin (pp. 189--202) in the volume edited by
% Hirose and Tao. Typed as incollection rather than inbook: the chapter has its
% own authors plus volume editors and a booktitle, which classic styles only
% render for incollection (inbook warns on author+editor and drops booktitle).
% NOTE(review): address holds a country, not the publisher's city -- confirm
% the correct location against the publisher record before changing it.
@incollection{72d6c997f95145dca192d24644f51fd6,
  author    = {Obin, Nicolas and Veaux, Christophe and Lanchantin, Pierre},
  title     = {Exploiting Alternatives for Text-To-Speech Synthesis: From Machine to Human},
  booktitle = {Speech Prosody in Speech Synthesis: Modeling and generation of prosody for high quality and flexible speech synthesis},
  editor    = {Hirose, Keikichi and Tao, Jianhua},
  series    = {Prosody, Phonology and Phonetics},
  publisher = {Springer},
  address   = {United Kingdom},
  year      = {2015},
  month     = feb,
  day       = {26},
  pages     = {189--202},
  isbn      = {978-3-662-45257-8},
  doi       = {10.1007/978-3-662-45258-5_13},
  language  = {English},
  abstract  = {The absence of alternatives/variants is a dramatical limitation of text-to-speech (TTS) synthesis compared to the variety of human speech. This chapter introduces the use of speech alternatives/variants in order to improve TTS synthesis systems. Speech alternatives denote the variety of possibilities that a speaker has to pronounce a sentence---depending on linguistic constraints, specific strategies of the speaker, speaking style, and pragmatic constraints. During the training, symbolic and acoustic characteristics of a unit-selection speech synthesis system are statistically modelled with context-dependent parametric models (Gaussian mixture models (GMMs)/hidden Markov models (HMMs)). During the synthesis, symbolic and acoustic alternatives are exploited using a Generalized Viterbi Algorithm (GVA) to determine the sequence of speech units used for the synthesis. Objective and subjective evaluations support evidence that the use of speech alternatives significantly improves speech synthesis over conventional speech synthesis systems. Moreover, speech alternatives can also be used to vary the speech synthesis for a given text. The proposed method can easily be extended to HMM-based speech synthesis.},
}