% Chapter "High performance big data clustering" in the book "Cloud Computing and Big Data"
% (series: Advances in Parallel Computing). Typed as @incollection because the chapter has
% its own title and the containing book is given in booktitle.
@incollection{51023385bbca415f9274d9dd9c987835,
title = "High performance big data clustering",
abstract = "Scientific advances are collectively exploding the amount, diversity, and complexity of data becoming available. Our ability to collect huge amounts of data has greatly surpassed our analytical capacity to make sense of it. Efficient use of high performance computing techniques is critical for the success of the data-driven paradigm to scientific discovery. Data clustering is one of the fundamental analytics tasks heavily relied upon in many application domains, like astrophysics, climate science, bioinformatics, etc. In this book chapter, we illustrate the challenges and opportunities in mining big data using two recently developed scalable parallel clustering algorithms. Experimental results on millions of high-dimensional data points clustered in parallel on thousands of processor cores are also presented.",
keywords = "big data, clustering, density-based clustering, hierarchical clustering",
author = "Agrawal, Ankit and Patwary, Md Mostofa Ali and Hendrix, William and Liao, Wei Keng and Choudhary, Alok",
year = "2013",
doi = "10.3233/978-1-61499-322-3-192",
language = "English (US)",
isbn = "9781614993216",
series = "Advances in Parallel Computing",
publisher = "IOS Press BV",
pages = "192--211",
booktitle = "Cloud Computing and Big Data",
}