@inproceedings{0703af0a9a69457c974e0911d91e2b3f,
title = "Lightweight End-To-End Deep Learning Model For Music Source Separation",
abstract = "In this work, we propose a lightweight end-to-end music source separation deep learning model. Deep learning models for audio source separation based on time-domain have been proposed for end-to-end processing. However, the proposed models are complex and difficult to use when the computing resources of the device are limited. Additionally, long delays may be expected since long-term inputs are required to obtain adequate results for separation, making the models unsuitable for applications that require low latency. In the proposed model, Atrous Spatial Pyramid Pooling is used to reduce the number of parameters, and the receptive field preserving decoder is utilized to enhance the result of separation while the input context length is limited. The experimental results show that the proposed method obtains better results than previous methods while using 10% or fewer parameters.",
keywords = "Deep learning, lightweight, music source separation",
author = "Wang, {Yao Ting} and Lin, {Yi Xing} and Liang, {Kai Wen} and Tai, {Tzu Chiang} and Wang, {Jia Ching}",
note = "Publisher Copyright: {\textcopyright} 2022 IEEE.; 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022 ; Conference date: 11-12-2022 Through 14-12-2022",
year = "2022",
doi = "10.1109/ISCSLP57327.2022.10037912",
language = "???core.languages.en_GB???",
series = "2022 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "315--318",
editor = "Lee, {Kong Aik} and Hung-yi Lee and Yanfeng Lu and Minghui Dong",
booktitle = "2022 13th International Symposium on Chinese Spoken Language Processing, ISCSLP 2022",
}