% Journal article entry. The `doi` field holds the bare identifier (no resolver
% prefix) so that bibliography styles can build the link themselves; the
% publisher landing page is kept separately in `url`.
@article{579,
  author   = {Arteaga, María and Gacto, María and Galende, Marta and Alcala-Fdez, Jesus and Alcalá, Rafael},
  title    = {Enhancing soft computing techniques to actively address imbalanced regression problems},
  journal  = {Expert Systems with Applications},
  year     = {2023},
  volume   = {234},
  pages    = {121011},
  issn     = {0957-4174},
  doi      = {10.1016/j.eswa.2023.121011},
  url      = {https://www.sciencedirect.com/science/article/pii/S0957417423015130},
  keywords = {Imbalanced regression, Multi-objective evolutionary algorithms, Fuzzy rule-based systems},
  abstract = {While research in the area of imbalance, which is understood as classes that are not equally represented, is mainly addressed in classification, it has hardly been studied in regression, where data maldistribution, or imbalance, can be defined as the existence of some specific subdomains of the output variable misrepresented in the training data set, resulting in low accuracy for new instances within these subdomains. The small amount of state-of-the-art techniques are “passive”, meaning they are only applied in preprocessing. In this contribution, we propose two new specific evolutionary algorithms based on fuzzy rules to “actively” address imbalanced regression problems and improve the overall performance of the algorithms instead of just addressing the imbalance problem. The results obtained after applying statistical tests to 32 regression datasets that handle more than 3000 partitions show the effectiveness of the proposed methods when compared to the best previous proposal, a passive method called SMOGN.
We can conclude: (1) we cannot affirm, since the equality hypotheses have not been rejected, that there are significant performance differences between using stratified and non-stratified data, thus we will use stratification to preserve a minimum representation of the minority set, (2) both fuzzy rule-based methods obtain better results in terms of the imbalance metric when using SMOGN, but in both methods this incurs a cost in accuracy (with confidence scores of over 99.0\%), and (3) the proposed methods outperform those using SMOGN as they get slightly better results in the imbalance metric, with better average ranks in both proposals, and obtain significantly better results in global accuracy, that is, all the performance metrics studied improve statistically with a confidence score of over 99.0\%, with the exception of one metric, which scores above 90.0\%.},
}