@inproceedings{1a17d341674d450eb0292029e90dc155,
title = "M-BIRCH: An online clustering approach for computer vision applications",
abstract = "We adapt a classic online clustering algorithm called Balanced Iterative Reducing and Clustering using Hierarchies (BIRCH), to incrementally cluster large datasets of features commonly used in multimedia and computer vision. We call the adapted version modified-BIRCH (m-BIRCH). The algorithm uses only a fraction of the dataset memory to perform clustering, and updates the clustering decisions when new data comes in. Modifications made in m-BIRCH enable data driven parameter selection and effectively handle varying density regions in the feature space. Data driven parameter selection automatically controls the level of coarseness of the data summarization. Effective handling of varying density regions is necessary to well represent the different density regions in data summarization. We use m-BIRCH to cluster 840K color SIFT descriptors, and 60K outlier corrupted grayscale patches. We use the algorithm to cluster datasets consisting of challenging non-convex clustering patterns. Our implementation of the algorithm provides an useful clustering tool and is made publicly available.",
keywords = "Automatic Threshold Selection, BIRCH, Computer Vision, Online clustering, Outlier Detection",
author = "Madan, {Siddharth K.} and Dana, {Kristin J.}",
note = "Publisher Copyright: {\textcopyright} 2015 SPIE-IS&T.; Imaging and Multimedia Analytics in a Web and Mobile World 2015 ; Conference date: 11-02-2015 Through 12-02-2015",
year = "2015",
doi = "10.1117/12.2078264",
language = "English (US)",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
publisher = "SPIE",
editor = "Allebach, {Jan P.} and Zhigang Fan and Qian Lin",
booktitle = "Proceedings of SPIE-IS and T Electronic Imaging - Imaging and Multimedia Analytics in a Web and Mobile World 2015",
address = "United States",
}