% Conference paper: ensemble neural network (ENN) framework for robust ASR,
% published in the ISCSLP 2016 proceedings (IEEE).
% NOTE(review): year/month/day (2017-05-02) presumably record the online
% publication date, while the conference itself took place in October 2016
% (see the note field) -- confirm against the publisher record.
@inproceedings{94f4cd22dae14d8f8f15db0998b7adb9,
  author    = {Hsu, {Chia Yung} and Zezario, {Ryandhimas E.} and Wang, {Jia Ching} and Ho, {Chin Wen} and Lu, Xugang and Tsao, Yu},
  title     = {Incorporating local environment information with ensemble neural networks to robust automatic speech recognition},
  booktitle = {Proceedings of 2016 10th International Symposium on {Chinese} Spoken Language Processing, {ISCSLP} 2016},
  editor    = {Wang, Hsin-Min and Hou, Qingzhi and Wei, Yuan and Lee, Tan and Wei, Jianguo and Xie, Lei and Feng, Hui and Dang, Jianwu},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2017},
  month     = may,
  day       = {2},
  doi       = {10.1109/ISCSLP.2016.7918489},
  language  = {english},
  keywords  = {Ensemble neural network, Environment clustering, Mixture of local experts, Robust ASR},
  abstract  = {This paper proposes an ensemble neural network (ENN) framework for robust automatic speech recognition (ASR). The proposed ENN framework can be divided into offline and online phases. In the offline phase, the ENN framework first applies an environment clustering technique to partition the training data into several subsets, where each subset characterizes specific local information of the entire acoustic space. Next, each subset of training data is adopted to train an NN acoustic model. Finally, the entire set of training data is used to estimate a gating function, which can determine the most suitable NN acoustic model given an input utterance. In the online phase, given the testing utterance, the gating function specifies the optimal NN acoustic model to perform speech recognition. Because local environment information is incorporated, ENN can effectively determine the NN acoustic model that optimally matches the testing condition. The proposed framework was evaluated on the Aurora-2 task. Experimental results show that the proposed ENN framework can provide a notable word error rate reduction of 5.35\% (from 5.05\% to 4.78\%) when compared to the baseline.},
  note      = {Publisher Copyright: {\textcopyright} 2016 IEEE. 10th International Symposium on Chinese Spoken Language Processing, ISCSLP 2016; conference date: 17--20 October 2016},
}