% ROCLING 2015 conference paper. The title is in Traditional Chinese; the
% abstract and keywords are in English.
% Percent signs in the abstract are escaped (\%) so the text stays intact if a
% style typesets it. The proceedings title is stored once, in booktitle.
@inproceedings{80c42f8ec0ef4a5796cd7fc3ad492dd1,
  author    = {Hsu, {Chia Yung} and Wang, {Jia Ching} and Tsao, Yu},
  title     = {類神經網路訓練結合環境群集及專家混合系統於強健性語音辨識},
  booktitle = {Proceedings of the 27th Conference on Computational Linguistics and Speech Processing, {ROCLING} 2015},
  editor    = {Chen, Sin-Horng and Wang, Hsin-Min and Chien, Jen-Tzung and Kao, Hung-Yu and Chang, Wen-Whei and Wang, Yih-Ru and Wu, Shih-Hung},
  publisher = {The Association for Computational Linguistics and Chinese Language Processing (ACLCLP)},
  pages     = {136--147},
  year      = {2015},
  month     = oct,
  day       = {1},
  language  = {繁體中文},
  keywords  = {Environment clustering, Mixture of experts, Neural network, Robust speech recognition},
  abstract  = {Recently, automatic speech recognition (ASR) using neural network (NN) based acoustic model (AM) has achieved significant improvements. However, the mismatch (including speaker and speaking environment) of training and testing conditions still confines the applicability of ASR. This paper proposes a novel approach that combines the environment clustering (EC) and mixture of experts (MOE) algorithms (thus the proposed approach is termed EC-MOE) to enhance the robustness of ASR against mismatches. In the offline phase, we split the entire training set into several subsets, with each subset characterizing a specific speaker and speaking environment. Then, we use each subset of training data to prepare an NN-based AM. In the online phase, we use a Gaussian mixture model (GMM)-gate to determine the optimal output from the multiple NN-based AMs to render the final recognition results. We evaluated the proposed EC-MOE approach on the Aurora 2 continuous digital speech recognition task. Comparing to the baseline system, where only a single NN-based AM is used for recognition, the proposed approach achieves a clear word error rate (WER) reduction of 5.9\% (5.25\% to 4.94\%).},
  note      = {Publisher Copyright: {\textcopyright} The Association for Computational Linguistics and Chinese Language Processing.; 27th Conference on Computational Linguistics and Speech Processing, ROCLING 2015 ; Conference date: 01-10-2015 Through 02-10-2015},
}