@inproceedings{ca15f6efe6f0490fa8974d85049c5599,
title = "DenClust: A density based seed selection approach for K-Means",
abstract = "In this paper we present a clustering technique called Den-Clust that produces high quality initial seeds through a deterministicprocess without requiring an user input on the number of clusters k andthe radius of the clusters r. The high quality seeds are given input to K-Means as the set of initial seeds to produce the final clusters. DenClustuses a density based approach for initial seed selection. It calculates thedensity of each record, where the density of a record is the number ofrecords that have the minimum distances with the record. This approachis expected to produce high quality initial seeds for K-Means resultingin high quality clusters from a dataset. The performance of DenClust iscompared with five (5) existing techniques namely CRUDAW, AGCUK,Simple K-means (SK), Basic Farthest Point Heuristic (BFPH) and NewFarthest Point Heuristic (NFPH) in terms of three (3) external clusterevaluation criteria namely F-Measure, Entropy, Purity and two (2) in-ternal cluster evaluation criteria namely Xie-Beni Index (XB) and Sumof Square Error (SSE). We use three (3) natural datasets that we obtain from the UCI machine learning repository. DenClust performs better than all five existing techniques in terms of all five evaluation criteria forall three datasets used in this study.",
keywords = "Open access version available, Cluster Evaluation, Clustering, Data Mining, K-Means",
author = "Rahman, {Md Anisur} and Islam, {Md Zahidul} and Terence Bossomaier",
year = "2014",
doi = "10.1007/978-3-319-07176-3_68",
language = "English",
volume = "8468",
publisher = "Springer International Publishing",
pages = "784--795",
booktitle = "Artificial Intelligence and Soft Computing",
note = "International Conference on Artificial Intelligence and Soft Computing ; Conference date: 01-06-2014 Through 05-06-2014",
}