% Conference paper from the ISCSLP 2018 proceedings (IEEE).
% Cleaned from a repository export: author names no longer carry escaped
% literal braces, acronyms in the title are brace-protected, the mis-encoded
% copyright sign in `note` is restored, localized `language`/`address` values
% are given in English, and the `series` field (an exact duplicate of
% `booktitle`) is dropped so the proceedings title is not printed twice.
% NOTE(review): `month`/`day` (2 Jul) do not match the conference dates given
% in `note` (26--29 Nov 2018) -- confirm against the publisher record.
% NOTE(review): `address` holds a country, not the publisher's city -- confirm
% the city if the target style prints it.
@inproceedings{ca0c9abb21aa40a5b0235d6d4ccb854c,
author = "Xie, Feng Long and Soong, Frank K. and Wang, Xi and He, Lei and Li, Haifeng",
title = "Frame selection in {SI-DNN} phonetic space with {WaveNet} vocoder for voice conversion without parallel training data",
booktitle = "2018 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018 - Proceedings",
pages = "56--60",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
address = "United States",
year = "2018",
month = jul,
day = "2",
doi = "10.1109/ISCSLP.2018.8706660",
language = "English",
keywords = "Deep neural network, Kullback-Leibler divergence, Voice conversion, WaveNet vocoder",
abstract = "In this paper, we propose a frame selection approach to voice conversion with speaker independent deep neural network (SI-DNN) and Kullback-Leibler divergence (KLD). The acoustic difference between source and target speaker is equalized with SI-DNN in the ASR senone phonetic space. KLD is used as an ideal distortion measure to select the corresponding target frame given the source frame. Acoustic trajectory of the selected frames is rendered with maximum probability trajectory generation algorithm. WaveNet based vocoder is applied on the converted acoustic trajectory to get the final speech waveform. From the subjective results we find that 1) the proposed method can achieve better performance than the phonetic cluster based selection method [16]; 2) by applying WaveNet vocoder the naturalness and speaker similarity can be significantly improved compared with linear predictive coding (LPC) based vocoder; 3) WaveNet vocoder trained only with spectral features i.e., line spectrum pairs (LSP) can better maintain the pitch pattern towards target speaker than WaveNet vocoder trained with both spectral features i.e., LSP and prosodic features (F0 and Unvoiced/Voiced flag).",
note = "Publisher Copyright: {\copyright} 2018 IEEE; 11th International Symposium on Chinese Spoken Language Processing, ISCSLP 2018 ; Conference date: 26-11-2018 Through 29-11-2018",
}