@inproceedings{611523d6937a42d99d97a5a0720c9202,
title = "Self-supervised Learning and Masked Language Model for Code-switching Automatic Speech Recognition",
abstract = "Code-switching (CS) is a common linguistic phenomenon that poses significant challenges for automatic speech recognition systems due to the lack of corpus. In this paper, we propose a novel approach to address this challenge by leveraging self-supervised learning (SSL) and the masked language model (MLM) in speech recognition. Specifically, we use the wav2vec 2.0 pre-trained model to reduce the dependency on CS labeled data, and the MLM to rerank sentences generated using beam search decoding. Our proposed method is evaluated on the SEAME dataset, and experimental results show that it outperforms state-of-the-art CS speech recognition approaches by 15.6% and 19.9% in terms of token error rates (TER). Moreover, the proposed method is generalizable and can be extended to other CS languages. These results demonstrate the effectiveness of our approach and its potential for future research in the field of CS speech recognition.",
keywords = "code-switching, masked language modeling, self-supervised learning, speech recognition",
author = "Chen, {Po Kai} and Fu, {Li Yeh} and Chen, {Cheng Kai} and Lin, {Yi Xing} and Chen, {Chih Ping} and Huang, {Chien Lin} and Wang, {Jia Ching}",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 10th IEEE International Conference on Communications and Electronics, ICCE 2024 ; Conference date: 31-07-2024 Through 02-08-2024",
year = "2024",
doi = "10.1109/ICCE62051.2024.10634607",
language = "???core.languages.en_GB???",
series = "ICCE 2024 - 2024 IEEE 10th International Conference on Communications and Electronics",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "387--391",
editor = "Jeong, {Seong Ho} and Loc, {Ho Dac} and Serge Fdida and Tho Le-Ngoc",
booktitle = "ICCE 2024 - 2024 IEEE 10th International Conference on Communications and Electronics",
}