references.bib

% FlexEval paper. The nonstandard pdf field is kept as an annotation next to the url field.
@inproceedings{Fayet2020,
    author       = {Fayet, Cédric and Blond, Alexis and Coulombel, Grégoire and Simon, Claude and Lolive, Damien and Lecorvé, Gwénolé and Chevelu, Jonathan and {Le Maguer}, Sébastien},
    title        = {{FlexEval, création de sites web légers pour des campagnes de tests perceptifs multimédias}},
    booktitle    = {{Proceedings of JEP, TALN and RECITAL}},
    year         = 2020,
    pages        = {22--25},
    address      = {Nancy, France},
    url          = {https://hal.archives-ouvertes.fr/hal-02768500},
    pdf          = {https://hal.archives-ouvertes.fr/hal-02768500v4/document},
    keywords     = {NAT},
}
% FastPitch paper. The surname accent is a plain {\'n} special character so
% that sort keys and labels are derived from a single letter.
@inproceedings{Lancucki2021,
    title        = {{FastPitch}: Parallel Text-to-Speech with Pitch Prediction},
    author       = {{\L}a{\'n}cucki, Adrian},
    year         = 2021,
    month        = jun,
    booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
    publisher    = {IEEE},
    pages        = {6588--6592},
    doi          = {10.1109/ICASSP39728.2021.9413889},
    issn         = {2379-190X},
}
% WORLD vocoder paper. The volume carries the journal's series letter
% (E99-D) -- NOTE(review): confirm against the DOI landing page.
@article{Morise2016,
    title        = {{WORLD}: a vocoder-based high-quality speech synthesis system for real-time applications},
    author       = {Masanori Morise and Fumiya Yokomori and Kenji Ozawa},
    year         = 2016,
    journal      = {{IEICE} Transactions on Information and Systems},
    publisher    = {The Institute of Electronics, Information and Communication Engineers},
    volume       = {E99-D},
    number       = 7,
    pages        = {1877--1884},
    doi          = {10.1587/transinf.2015EDP7457},
}
% WaveNet arXiv preprint, recorded dblp-style (journal = CoRR, volume = abs/<id>).
% Names use "von Last, First" form so the particle "van den" is parsed as such.
@article{Oord2016,
    title        = {{WaveNet}: {A} Generative Model for Raw Audio},
    author       = {van den Oord, A{\"a}ron and Dieleman, Sander and Zen, Heiga and Simonyan, Karen and Vinyals, Oriol and Graves, Alex and Kalchbrenner, Nal and Senior, Andrew W. and Kavukcuoglu, Koray},
    year         = 2016,
    journal      = {CoRR},
    volume       = {abs/1609.03499},
    url          = {https://arxiv.org/abs/1609.03499},
    archiveprefix = {arXiv},
    eprint       = {1609.03499},
    timestamp    = {Mon, 13 Aug 2018 16:49:15 +0200},
    biburl       = {https://dblp.org/rec/bib/journals/corr/OordDZSVGKSK16},
    bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Software reference; the URL points at one specific commit of the GitHub repository.
@online{Valentini2020,
    title        = {{Tacotron + WaveRNN}},
    author       = {Cassia Valentini-Botinhao and Avashna Govender and Ollie McCarthy},
    year         = 2020,
    url          = {https://github.com/cassiavb/Tacotron/commit/946408f8cd7b5fe9c53931c631267ba2a723910d},
}
% Software reference; the URL points at one specific commit of the GitHub repository.
@online{Yamamoto2020b,
    title        = {{WaveNet}},
    author       = {Ryuichi Yamamoto},
    year         = 2020,
    url          = {https://github.com/r9y9/wavenet_vocoder/commit/a35fff76ea3687b05e1a10023cad3f7f64fa25a3},
}
% Software reference; the URL points at one specific commit of the GitHub repository.
@online{Hayashi2021,
    title        = {{Parallel WaveGAN}},
    author       = {Tomoki Hayashi},
    year         = 2021,
    url          = {https://github.com/kan-bayashi/ParallelWaveGAN/commit/6d4411b65f9487de5ec49dabf029dc107f23192d},
}
% Software reference; the URL points at one specific commit of the GitHub repository.
% The author is a corporate name, double-braced so it is kept as one unit.
@online{NVIDIA2021,
    title        = {{FastPitch}},
    author       = {{NVIDIA Group}},
    year         = 2021,
    url          = {https://github.com/NVIDIA/DeepLearningExamples/commit/6a642837c471c596aab7edf204384f66e9483ab2},
}
% MaryTTS paper. The compound surname "Le Maguer" is braced so that "Le" is
% not parsed as part of the given name.
@inproceedings{Steiner2018,
    title        = {Creating New Language and Voice Components for the Updated {MaryTTS} Text-to-Speech Synthesis Platform},
    author       = {Steiner, Ingmar and {Le Maguer}, Sébastien},
    year         = 2018,
    booktitle    = {International Conference on Language Resources and Evaluation ({LREC})},
    language     = {english},
}
% Tacotron arXiv preprint, recorded dblp-style (journal = CoRR, volume = abs/<id>).
@article{Wang2017,
    title        = {Tacotron: {A} Fully End-to-End Text-To-Speech Synthesis Model},
    author       = {Yuxuan Wang and R. J. Skerry{-}Ryan and Daisy Stanton and Yonghui Wu and Ron J. Weiss and Navdeep Jaitly and Zongheng Yang and Ying Xiao and Zhifeng Chen and Samy Bengio and Quoc V. Le and Yannis Agiomyrgiannakis and Rob Clark and Rif A. Saurous},
    year         = 2017,
    journal      = {CoRR},
    volume       = {abs/1703.10135},
    url          = {https://arxiv.org/abs/1703.10135},
    archiveprefix = {arXiv},
    eprint       = {1703.10135},
    timestamp    = {Mon, 13 Aug 2018 16:46:33 +0200},
    biburl       = {https://dblp.org/rec/bib/journals/corr/WangSSWWJYXCBLA17},
    bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% Parallel WaveGAN paper. The month uses the predefined macro so the style
% controls how it is rendered.
@inproceedings{Yamamoto2020,
    title        = {Parallel {WaveGAN}: A Fast Waveform Generation Model Based on Generative Adversarial Networks with Multi-Resolution Spectrogram},
    author       = {Yamamoto, Ryuichi and Song, Eunwoo and Kim, Jae-Min},
    year         = 2020,
    month        = may,
    booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP})},
    publisher    = {IEEE},
    pages        = {6199--6203},
    doi          = {10.1109/ICASSP40776.2020.9053795},
    issn         = {2379-190X},
}