@inproceedings{9dd0bc38fb984009b4be816fb28497f3,
  author    = {Chiang, {I. Jen} and Lin, {Tsau Young} and Hsu, {Jane Yung Jen}},
  title     = {Generating hypergraph of term associations for automatic document concept clustering},
  booktitle = {Proceedings of the Eighth IASTED International Conference on Artificial Intelligence and Soft Computing},
  editor    = {Pobil, A. P.},
  pages     = {181--186},
  year      = {2004},
  isbn      = {0889864586},
  language  = {English},
  keywords  = {Association Rules, Concept, Connected Components, Decomposition, Document Clustering, Hypergraph},
  abstract  = {This paper presents a novel approach to document clustering using hypergraph decomposition. Given a set of documents, the associations among frequently co-occurring terms in any of the documents define naturally a hypergraph, which can then be decomposed into connected components at various levels. Each connected component represents a primitive concept in the collection. The documents can then be clustered based on the primitive concepts. Experiments with three different data sets from web pages and medical literatures have shown that the proposed unsupervised clustering approach performs significantly better than traditional clustering algorithms, such as k-means, AutoClass and Hierarchical Clustering (HAC). The results indicate that hypergraphs are a perfect model to capture association rules in text and is very useful for automatic document clustering.},
  note      = {Proceedings of the Eighth IASTED International Conference on Artificial Intelligence and Soft Computing ; Conference date: 01-09-2004 Through 03-09-2004},
}