@comment{Conference paper in the O-COCOSDA 2024 proceedings. The series field was dropped because it repeated booktitle verbatim, and the copyright notice lives in a field that standard styles ignore so it is not printed with every citation.}
@inproceedings{2b340061c53a4d3b8c1efbfb736cdd5e,
  author        = {Dewangga, Dhiya and Lestari, Dessi and Purwarianti, Ayu and Tanaya, Dipta and Azizah, Kurniawati and Sakti, Sakriani},
  title         = {An Evaluation of Neural Vocoder-Based Voice Cloning System for Dysphonia Speech Disorder},
  booktitle     = {2024 27th Conference on the Oriental {COCOSDA} International Committee for the Co-Ordination and Standardisation of Speech Databases and Assessment Techniques, {O-COCOSDA} 2024 - Proceedings},
  editor        = {Su, Ming-Hsiang and Yeh, Jui-Feng and Liao, Yuan-Fu and Lee, Chi-Chun and Taso, Yu},
  publisher     = {Institute of Electrical and Electronics Engineers Inc.},
  address       = {United States},
  year          = {2024},
  doi           = {10.1109/O-COCOSDA64382.2024.10800714},
  language      = {English},
  keywords      = {dysphonia, speech synthesis, text-to-speech, vocoder, voice cloning},
  abstract      = {Dysphonia is a voice disorder affecting voice quality, quantity, and intensity, occurring at various ages and diverse backgrounds. Dysphonia impacts the difficulty of communication, thereby reducing the overall quality of life. Medical solutions have been proposed to improve the speech quality of individuals with dysphonia. However, these solutions are often limited by considerable expenses and time-consuming procedures. Therefore, alternative solutions are needed to enhance speech quality. The widespread development of technology in various domains can be proposed as an alternative solution. One is speech processing technology using text-to-speech (TTS) with voice cloning techniques. Our work presents the impact of the vocoder in a voice cloning system on the quality of synthesized speech for dysphonia speakers. We compare selected vocoder models based on architecture and performance. Furthermore, we explore the effect of using Speaker Conditionals on the vocoder. We perform an objective evaluation for each vocoder to measure the quality of the models.},
  note          = {Conference held 17--19 October 2024},
  copyright     = {{\textcopyright} 2024 IEEE},
  internal-note = {NOTE(review): address holds a country rather than a publisher city, and the editor surname Taso may be a transposition of Tsao -- confirm both against the publisher record before relying on them.},
}