% Conference paper: CNMBI (Zhang, Zheng, Wang), ADMA 2023 proceedings, LNCS series, pp. 262--277.
@inproceedings{65c75ccce86d420ea05ff4ddcde5aa87,
  author    = {Zhang, Ruilin and Zheng, Haiyang and Wang, Hongpeng},
  title     = {{CNMBI}: Determining the Number of Clusters Using Center Pairwise Matching and Boundary Filtering},
  booktitle = {Advanced Data Mining and Applications - 19th International Conference, {ADMA} 2023, Proceedings},
  editor    = {Yang, Xiaochun and Wang, Bin and Suhartanto, Heru and Wang, Guoren and Jiang, Jing and Li, Bing and Zhu, Huaijie and Cui, Ningning},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  pages     = {262--277},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2023},
  doi       = {10.1007/978-3-031-46677-9_19},
  isbn      = {9783031466762},
  language  = {English},
  keywords  = {Boundary filtering, Cluster center, Complex data, Number of clusters, Pairwise matching},
  abstract  = {One of the main challenges in data mining is choosing the optimal number of clusters without prior information. Notably, existing methods are usually in the philosophy of cluster validation and hence have underlying assumptions on data distribution, which prevents their application to complex data such as large-scale images and high-dimensional data from the real world. In this regard, we propose an approach named CNMBI. Leveraging the distribution information inherent in the data space, we map the target task as a dynamic comparison process between cluster centers regarding positional behavior, without relying on the complete clustering results and designing the complex validity index as before. Bipartite graph theory is then employed to efficiently model this process. Additionally, we find that different samples have different confidence levels and thereby actively remove low-confidence ones, which is, for the first time to our knowledge, considered in cluster number determination. CNMBI is robust and allows for more flexibility in the dimension and shape of the target data (e.g., CIFAR-10 and STL-10). Extensive comparisons with state-of-the-art competitors on various challenging datasets demonstrate the superiority of our method.},
  note      = {Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2023.; 19th International Conference on Advanced Data Mining and Applications, ADMA 2023 ; Conference date: 21-08-2023 Through 23-08-2023},
}