@inproceedings{451bda5b42a947c1bef182401a4b1a5f,
title = "Gaussian process based text categorization for healthy information",
abstract = "As the development of the medical technology, more and more people start to pay attention to their health. A large amount of health information can be easily obtained from the website now. Therefore, text categorization is important to analyze the information. In this work, we propose a system for text categorization that is based on a Gaussian process. Our proposed system involves the two parts- feature learning and classification. In the first part, we apply the latent Dirichlet allocation (LDA) to obtain the K latent topics proportion from each document. The K-dimensional vector is regarded as the feature of each document. In the classification part, a Gaussian process (GP) is utilized for the text categorization. 10 classes of text documents are categorized by the one-versus-one approach. The experimental results show that our proposed system performs well in text categorization, especially with the small size of training dataset.",
keywords = "classification, feature learning, Gaussian process, Latent Dirichlet Allocation, text categorization",
author = "Chen, {Sih Huei} and Lee, {Yuan Shan} and Tai, {Tzu Chiang} and Wang, {Jia Ching}",
note = "Publisher Copyright: {\textcopyright} 2015 IEEE.; 3rd International Conference on Orange Technologies, ICOT 2015 ; Conference date: 19-12-2015 Through 22-12-2015",
year = "2016",
month = jun,
day = "22",
doi = "10.1109/ICOT.2015.7498487",
language = "???core.languages.en_GB???",
series = "Proceedings of 2015 International Conference on Orange Technologies, ICOT 2015",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "30--33",
booktitle = "Proceedings of 2015 International Conference on Orange Technologies, ICOT 2015",
}