Ryo Terashima, Ryuichi Yamamoto, Eunwoo Song, Yuma Shirahata, Hyun-Wook Yoon, Jae Min Kim, Kentaro Tachibana. Cross-Speaker Emotion Transfer for Low-Resource Text-to-Speech Using Non-Parallel Voice Conversion with Pitch-Shift Data Augmentation. In Hanseok Ko, John H. L. Hansen, editors, Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022. Pages 3018-3022, ISCA, 2022. doi:10.21437/Interspeech.2022-11278
% Interspeech 2022 conference paper. Names are stored in "Last, First" form and the page range uses "--".
@inproceedings{TerashimaYSSYKT22,
  author    = {Terashima, Ryo and Yamamoto, Ryuichi and Song, Eunwoo and Shirahata, Yuma and Yoon, Hyun-Wook and Kim, Jae Min and Tachibana, Kentaro},
  title     = {Cross-Speaker Emotion Transfer for Low-Resource Text-to-Speech Using Non-Parallel Voice Conversion with Pitch-Shift Data Augmentation},
  booktitle = {Interspeech 2022, 23rd Annual Conference of the International Speech Communication Association, Incheon, Korea, 18-22 September 2022},
  editor    = {Ko, Hanseok and Hansen, John H. L.},
  pages     = {3018--3022},
  publisher = {ISCA},
  year      = {2022},
  doi       = {10.21437/Interspeech.2022-11278},
  url       = {https://doi.org/10.21437/Interspeech.2022-11278},
  researchr = {https://researchr.org/publication/TerashimaYSSYKT22},
  cites     = {0},
  citedby   = {0},
}