@inproceedings{b99154ff305d45a79d06e19813f79427,
title = "Sparse data for document clustering",
abstract = "Document clustering which is a part of text mining framework is used to process models and real data collection of cancer documents into several groups. A vector space model of the documents based on their key phrases are formed and called sparse matrix which contains many zero values. A sparse dimensional reduction and several methods of clustering include K-means, Self Organizing and Non-negative Matrices Factorization (NMF) are applied to the data, then the results are compared. Sparse method in dimensional reduction step using Arnoldi Method provides a better result of clustering validity twice more than standard dimensional reduction result.",
keywords = "arnoldi method, competitive learning, k-means, non-negative matrices factorization, self-organizing, sparse",
author = "Ionia Veritawati and Ito Wasito and Mujiono",
year = "2013",
doi = "10.1109/ICoICT.2013.6574546",
language = "English",
isbn = "9781467349925",
series = "2013 International Conference of Information and Communication Technology, ICoICT 2013",
pages = "38--43",
booktitle = "2013 International Conference of Information and Communication Technology, ICoICT 2013",
note = "2013 International Conference of Information and Communication Technology, ICoICT 2013 ; Conference date: 20-03-2013 Through 22-03-2013",
}