
@Article{cmc.2025.057693,
AUTHOR = {Yuan Ping, Huina Li, Chun Guo, Bin Hao},
TITLE = {<i>k</i>ProtoClust: Towards Adaptive <i>k</i>-Prototype Clustering without Known <i>k</i>},
JOURNAL = {Computers, Materials \& Continua},
VOLUME = {82},
YEAR = {2025},
NUMBER = {3},
PAGES = {4949--4976},
URL = {http://www.techscience.com/cmc/v82n3/59875},
ISSN = {1546-2226},
ABSTRACT = {Towards optimal <i>k</i>-prototype discovery, <i>k</i>-means-like algorithms give us inspirations of central samples collection, yet the unstable seed samples selection, the hypothesis of a circle-like pattern, and the unknown <i>K</i> are still challenges, particularly for non-predetermined data patterns. We propose an adaptive <i>k</i>-prototype clustering method (<i>k</i>ProtoClust) which launches cluster exploration with a sketchy division of <i>K</i> clusters and finds evidence for splitting and merging. On behalf of a group of data samples, support vectors and outliers from the perspective of support vector data description are not the appropriate candidates for prototypes, while inner samples become the first candidates for instability reduction of seeds. Different from the representation of samples in traditional, we extend sample selection by encouraging fictitious samples to emphasize the representativeness of patterns. To get out of the circle-like pattern limitation, we introduce a convex decomposition-based strategy of one-cluster-multiple-prototypes in which convex hulls of varying sizes are prototypes, and accurate connection analysis makes the support of arbitrary cluster shapes possible. Inspired by geometry, the three presented strategies make <i>k</i>ProtoClust bypassing the <i>K</i> dependence well with the global and local position relationship analysis for data samples. Experimental results on twelve datasets of irregular cluster shape or high dimension suggest that <i>k</i>ProtoClust handles arbitrary cluster shapes with prominent accuracy even without the prior knowledge <i>K</i>.},
DOI = {10.32604/cmc.2025.057693}
}



