%Aigaion2 BibTeX export from Idiap Publications
%Thursday 21 November 2024 01:03:59 PM

% Journal article entry.
%  - doi holds the bare identifier (no "doi:" or resolver prefix); styles add the resolver themselves.
%  - HMM in the title is brace-protected so sentence-casing styles keep it upper-case.
%  - projects and pdf are repository-specific fields; BibTeX styles ignore unknown fields.
%  - NOTE(review): volume/number/pages are absent from the export -- confirm against the publisher record.

@ARTICLE{Dines_CSL_2011,
  author   = {Dines, John and Liang, Hui and Saheer, Lakshmi and Gibson, Matthew and Byrne, William and Oura, Keiichiro and Tokuda, Keiichi and Yamagishi, Junichi and King, Simon and Wester, Mirjam and Hirsim{\"{a}}ki, Teemu and Karhila, Reima and Kurimo, Mikko},
  title    = {Personalising speech-to-speech translation: Unsupervised cross-lingual speaker adaptation for {HMM}-based speech synthesis},
  journal  = {Computer Speech and Language},
  year     = {2011},
  doi      = {10.1016/j.csl.2011.08.003},
  url      = {http://www.sciencedirect.com/science/article/pii/S0885230811000441},
  pdf      = {https://publications.idiap.ch/attachments/papers/2011/Dines_CSL_2011.pdf},
  keywords = {cross-lingual speaker adaptation, Machine Translation, speech recognition, speech synthesis},
  projects = {Idiap, EMIME},
  abstract = {In this paper we present results of unsupervised cross-lingual speaker adaptation applied to text-to-speech synthesis. The application of our research is the personalisation of speech-to-speech translation in which we employ a HMM statistical framework for both speech recognition and synthesis. This framework provides a logical mechanism to adapt synthesised speech output to the voice of the user by way of speech recognition. In this work we present results of several different unsupervised and cross-lingual adaptation approaches as well as an end-to-end speaker adaptive speech-to-speech translation system. Our experiments show that we can successfully apply speaker adaptation in both unsupervised and cross-lingual scenarios and our proposed algorithms seem to generalise well for several language pairs. We also discuss important future directions including the need for better evaluation metrics.},
}