% Conference paper: MoEVC, published in the ISCSLP 2021 proceedings.
% Maintainer notes:
%   - The citation key is kept exactly as exported so existing citations keep resolving.
%   - Acronyms in the title and booktitle are brace-protected so sentence-casing styles keep them.
%   - The percent sign in the abstract is escaped so that styles which typeset the
%     abstract do not read it as the start of a LaTeX comment.
%   - The day and language fields are not used by the classic standard styles;
%     they are retained as metadata only.
%   - The address holds the country given by the export (translated to English);
%     TODO confirm whether the publisher city should be recorded instead.
@inproceedings{d815b457c78e4f0fba34c49eafc1259e,
  author    = {Chang, {Yu Tao} and Yang, {Yuan Hong} and Peng, {Yu Huai} and Wang, {Syu Siang} and Chi, Tai-Shih and Tsao, Yu and Wang, {Hsin Min}},
  title     = {{MoEVC}: A Mixture of Experts Voice Conversion System with Sparse Gating Mechanism for Online Computation Acceleration},
  booktitle = {2021 12th International Symposium on Chinese Spoken Language Processing, {ISCSLP} 2021},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2021},
  month     = jan,
  day       = {24},
  doi       = {10.1109/ISCSLP49672.2021.9362072},
  language  = {English},
  keywords  = {Voice conversion, fully convolutional network, mixture of experts, non-parallel VC, variational autoencoder},
  abstract  = {Owing to the recent advancements in deep learning technology, the performance of voice conversion (VC) in terms of quality and similarity has significantly improved. However, complex computation is generally required for deep-learning-based VC systems. This can cause a notable latency, which limits the deployment of such VC systems in real-world applications. Therefore, increasing the efficiency of online computing has become an important task. In this study, we propose a novel mixture-of-experts (MoE) based VC system, termed MoEVC. The MoEVC system uses a gating mechanism to assign weights to feature maps to increase VC performance. In addition, applying sparse constraints on the gating mechanism can skip some convolution processes through elimination of redundant feature maps, thereby accelerating online computing. Experimental results show that by using proper sparse constraints, we can effectively reduce the FLOPs (floating-point operations) count by 70\%, while improving VC performance in both objective evaluation and human subjective listening tests.},
  note      = {Publisher Copyright: {\textcopyright} 2021 IEEE.; 12th International Symposium on Chinese Spoken Language Processing, ISCSLP 2021 ; Conference date: 24-01-2021 Through 27-01-2021},
}