% Conference paper published in the ICCSA 2011 proceedings (see booktitle and doi).
% language holds a plain language identifier rather than an export placeholder.
% No series field: the proceedings title belongs in booktitle only, so it is not repeated.
@inproceedings{51807ab419814df3a189ade02d34a6d5,
title = "An evaluation of the formal concept analysis-based document vector on document clustering",
abstract = "In conventional approaches, documents are represented by the vector whose dimensionalities are equivalent to the terms extracted from a document set. These approaches, called bag-of-term approaches, ignore the conceptual relationships between terms such as synonyms, hypernyms and hyponyms. In the past, researches have applied thesauri such as Word Net to solve this problem. However, thesauri such as Word Net are developed more for general purposes and are limited in specific domain. Therefore, an automatically built ontology for terms is desired. In our previous study, we proposed a method which applies formal concept analysis (FCA), an automatic ontology building method, to extract the term relationships from a document set, and then apply the extracted information as the ontology of terms to represent the documents as concept vectors. In order to evaluate the usability and effectiveness of the proposed method for information retrieval related applications, we employed the concept vectors generated for the documents to the document clustering. In this study, we apply bisecting k-means clustering and hierarchical agglomerative clustering as the platforms with which to evaluate our method.",
keywords = "Concept vector, Document clustering, Document vector, Formal concept analysis, Term ontology",
author = "Jehng, {Jihn Chang} and Chou, Shihchieh and Cheng, {Chin Yi} and Heh, {Jia Sheng}",
year = "2011",
doi = "10.1109/ICCSA.2011.57",
language = "english",
isbn = "9780769544045",
pages = "207--210",
booktitle = "Proceedings - 2011 International Conference on Computational Science and Its Applications, ICCSA 2011",
note = "11th International Conference on Computational Science and Its Applications, ICCSA 2011 ; Conference date: 20-06-2011 Through 23-06-2011",
}