%Aigaion2 BibTeX export from Idiap Publications
%Thursday 21 November 2024 01:02:57 PM

% Workshop paper: VTLN cast as a linear DNN layer for speaker adaptation in speech synthesis.
% Acronyms in title/booktitle are brace-protected so sentence-casing styles keep them upper-case.
@INPROCEEDINGS{Schnell_SSW10_2019,
         author = {Schnell, Bastian and Garner, Philip N.},
       projects = {MASS},
          month = sep,
          title = {Neural {VTLN} for Speaker Adaptation in {TTS}},
      booktitle = {Proc. 10th {ISCA} Speech Synthesis Workshop},
           year = {2019},
          pages = {6},
       location = {Vienna, Austria},
   organization = {ISCA},
            doi = {10.21437/ssw.2019-6},
       abstract = {Vocal tract length normalisation (VTLN) is well established as a  speaker  adaptation  technique  that  can  work  with  very  little adaptation data. It is also well known that VTLN can be cast as a linear transform in the cepstral domain.  Building on this latter property, we show that it can be cast as a (linear) layer in a deep neural network (DNN) for speech synthesis. We show that VTLN parameters can then be trained in the same framework as the rest of the DNN using automatic gradients.  Experimental results show that the DNN is capable of predicting phone-dependent warpings on artificial data,  and that such warpings improve the quality of an acoustic model on real data in subjective listening tests.},
            pdf = {https://publications.idiap.ch/attachments/papers/2019/Schnell_SSW10_2019.pdf}
}