Discriminative clustering of text documents (2002)
AUTHORS:
Peltonen Jaakko,
Sinkkonen Janne,
Kaski Samuel
BOOKTITLE:
Proceedings of ICONIP'02, 9th International Conference on Neural Information Processing
PAGES:
1956-1960
URL:
http://ieeexplore.ieee.org/search/srchabstract.jsp?arnumber=1199015&isnumber=26990&punumber=8534&k2dockey=1199015@ieeecnfs&query=%28%28discriminative+clustering+of+text+documents%29%3Cin%3Emetadata%29&pos=0
% Conference paper record. `flags` and `impactfactor` are non-standard fields;
% standard bibliography styles ignore field names they do not recognize.
@inproceedings{Peltonen02iconip,
  author       = {Peltonen, Jaakko and Sinkkonen, Janne and Kaski, Samuel},
  title        = {Discriminative clustering of text documents},
  editor       = {Wang, Lipo and Rajapakse, Jagath C. and Fukushima, Kunihiko and Lee, Soo-Young and Yao, Xin},
  booktitle    = {Proceedings of {ICONIP'02}, 9th International Conference on Neural Information Processing},
  volume       = {4},
  pages        = {1956--1960},
  publisher    = {IEEE},
  address      = {Piscataway, NJ},
  year         = {2002},
  note         = {Preprint postscript at \url{http://www.cis.hut.fi/projects/mi/papers/iconip02.ps.gz}},
  url          = {http://ieeexplore.ieee.org/search/srchabstract.jsp?arnumber=1199015&isnumber=26990&punumber=8534&k2dockey=1199015@ieeecnfs&query=%28%28discriminative+clustering+of+text+documents%29%3Cin%3Emetadata%29&pos=0},
  abstract     = {Vector-space and distributional methods for text document clustering are discussed. Discriminative clustering, a recently proposed method, uses external data to find task-relevant characteristics of the documents, yet the clustering is defined even with no external data. We introduce a distributional version of discriminative clustering that represents text documents as probability distributions. The methods are tested in the task of clustering scientific document abstracts, and the ability of the methods to predict an independent topical classification of the abstracts is compared. The discriminative methods found topically more meaningful clusters than the vector space and distributional clustering models.},
  flags        = {AIRC copy},
  impactfactor = {D3},
}