The Centre for Speech Technology Research, The University of Edinburgh

Publications by Christophe Veaux

cveaux.bib

% Interspeech 2012 conference paper on speaker clustering for HMM-based synthesis.
% The month uses the standard BibTeX macro so that styles can abbreviate or localise it.
@inproceedings{Dall_Veaux_Yamagishi_King_Interspeech2012,
  author = {Dall, Rasmus and Veaux, Christophe and Yamagishi, Junichi and King, Simon},
  title = {Analysis of speaker clustering techniques for {HMM}-based speech synthesis},
  booktitle = {Proc. Interspeech},
  month = sep,
  year = {2012},
  pdf = {http://www.cstr.inf.ed.ac.uk/downloads/publications/2012/Dall_Veaux_Yamagishi_King_Interspeech2012.pdf},
  abstract = {This paper describes a method for speaker clustering, with the application of building average voice models for speaker-adaptive HMM-based speech synthesis that are a good basis for adapting to specific target speakers. Our main hypothesis is that using perceptually similar speakers to build the average voice model will be better than use unselected speakers, even if the amount of data available from perceptually similar speakers is smaller. We measure the perceived similarities among a group of 30 female speakers in a listening test and then apply multiple linear regression to automatically predict these listener judgements of speaker similarity and thus to identify similar speakers automatically. We then compare a variety of average voice models trained on either speakers who were perceptually judged to be similar to the target speaker, or speakers selected by the multiple linear regression, or a large global set of unselected speakers. We find that the average voice model trained on perceptually similar speakers provides better performance than the global model, even though the latter is trained on more data, confirming our main hypothesis. However, the average voice model using speakers selected automatically by the multiple linear regression does not reach the same level of performance.},
  categories = {Statistical parametric speech synthesis, hidden Markov models, speaker adaptation}
}
% Invited journal article (Acoustical Science and Technology 33(1)) on voice banking and reconstruction.
% The abstract uses ASCII apostrophes only, so the entry is safe under classic 8-bit BibTeX.
@article{2012E121001,
  author = {Yamagishi, Junichi and Veaux, Christophe and King, Simon and Renals, Steve},
  title = {Speech synthesis technologies for individuals with vocal disabilities: Voice banking and reconstruction},
  journal = {Acoustical Science and Technology},
  volume = {33},
  number = {1},
  pages = {1--5},
  year = {2012},
  doi = {10.1250/ast.33.1},
  url = {http://www.jstage.jst.go.jp/browse/ast/33/1/_contents},
  pdf = {http://www.cstr.inf.ed.ac.uk/downloads/publications/2012/AST-33_1.pdf},
  abstract = {In this invited paper, we overview the clinical applications of speech synthesis technologies and explain a few selected researches. We also introduce the University of Edinburgh's new project ``Voice Banking and reconstruction'' for patients with degenerative diseases, such as motor neurone disease and Parkinson's disease and show how speech synthesis technologies can improve the quality of life for the patients.}
}
% Interspeech 2015 conference paper on speaker adaptation for DNN-based synthesis.
% The venue is spelled "Proc. Interspeech" so every Interspeech entry in this file prints the same way.
@inproceedings{wu2015adaptation,
  author = {Wu, Zhizheng and Swietojanski, Pawel and Veaux, Christophe and Renals, Steve and King, Simon},
  title = {A study of speaker adaptation for {DNN}-based speech synthesis},
  booktitle = {Proc. Interspeech},
  year = {2015},
  pdf = {http://www.cstr.inf.ed.ac.uk/downloads/publications/2015/is2015_dnn_adaptation.pdf}
}