@misc{10481/88641, year = {2022}, month = {1}, url = {https://hdl.handle.net/10481/88641}, abstract = {Finding a balance between diversity and convergence plays an important role in evolutionary algorithms to avoid premature convergence and to perform a better exploration of the search space. In the case of Genetic Programming, and more specifically for symbolic regression problems, different mechanisms have been devised to control diversity, ranging from novel crossover and/or mutation procedures to the design of distance measures that help genetic operators to increase diversity in the population. In this paper, we start from previous works where Straight Line Programs are used as an alternative representation to expression trees for symbolic regression, and develop a similarity measure based on edit distance in order to determine how different the Straight Line Programs in the population are. This measure is used in combination with the CHC algorithm strategy to control diversity in the population, and therefore to avoid local optima to solve symbolic regression problems. The proposal is first validated in a controlled scenario of benchmark datasets and it is compared with previous approaches to promote diversity in Genetic Programming. After that, the approach is also evaluated in a real world dataset of energy consumption data from a set of buildings of the University of Granada.}, organization = {PID2020-112495RB-C21}, organization = {B-TIC-42-UGR20}, publisher = {Elsevier}, keywords = {Diversity}, keywords = {Edit distance}, keywords = {Symbolic regression}, keywords = {Genetic Programming}, keywords = {Straight Line Program}, title = {A similarity measure for Straight Line Programs and its application to control diversity in Genetic Programming}, doi = {10.1016/j.eswa.2021.116415}, author = {Rueda Delgado, Ramón and Pegalajar Cuéllar, Manuel and Baca Ruiz, Luis Gonzaga and Pegalajar Jiménez, María Del Carmen}, }