% Conference paper, International Conference on Hybrid Artificial Intelligence Systems (2020).
% Conventions: authors in "Last, First" form; DOI stored bare (no resolver prefix);
% page range written with "--". The citation key is kept unchanged for existing \cite calls.
@inproceedings{790,
  author    = {Gonz{\'a}lez-Almagro, Germ{\'a}n and Suarez, Juan Luis and Luengo, Juli{\'a}n and Cano, J. R. and Garc{\'\i}a, Salvador},
  title     = {Agglomerative Constrained Clustering Through Similarity and Distance Recalculation},
  booktitle = {International Conference on Hybrid Artificial Intelligence Systems},
  year      = {2020},
  pages     = {424--436},
  doi       = {10.1007/978-3-030-61705-9_35},
  keywords  = {Agglomerative clustering, constrained clustering, Semi-supervised learning, Similarity recalculation},
  abstract  = {Constrained clustering has become a topic of considerable interest in machine learning, as it has been shown to produce promising results in domains where only partial information about how to solve the problem is available. Constrained clustering can be viewed as a semi-supervised generalization of clustering, which is traditionally unsupervised. It is able to leverage a new type of information encoded by constraints that guide the clustering process. In particular, this study focuses on instance-level must-link and cannot-link constraints. We propose an agglomerative constrained clustering algorithm, which combines distance-based and clustering-engine adapting methods to incorporate constraints into the partitioning process. It computes a similarity measure on the basis of distances (in the dataset) and constraints (in the constraint set) to later apply an agglomerative clustering method, whose clustering engine has been adapted to consider constraints and raw distances. We prove its capability to produce quality results for the constrained clustering problem by comparing its performance to previous proposals on several datasets with incremental levels of constraint-based information.},
}