Fighting Underspecification in Symbolic Regression with Fitness Sharing
Created by W.Langdon from
gp-bibliography.bib Revision:1.8051
- @InProceedings{de-franca:2023:GECCOcomp,
-
author = "Fabricio {Olivetti De Franca}",
-
title = "Fighting Underspecification in Symbolic Regression
with Fitness Sharing",
-
booktitle = "Proceedings of the 2023 Genetic and Evolutionary
Computation Conference",
-
year = "2023",
-
editor = "Sara Silva and Luis Paquete and Leonardo Vanneschi and
Nuno Lourenco and Ales Zamuda and Ahmed Kheiri and
Arnaud Liefooghe and Bing Xue and Ying Bi and
Nelishia Pillay and Irene Moser and Arthur Guijt and
Jessica Catarino and Pablo Garcia-Sanchez and
Leonardo Trujillo and Carla Silva and Nadarajen Veerapen",
-
pages = "551--554",
-
address = "Lisbon, Portugal",
-
series = "GECCO '23",
-
month = "15-19 " # jul,
-
organisation = "SIGEVO",
-
publisher = "Association for Computing Machinery",
-
publisher_address = "New York, NY, USA",
-
keywords = "genetic algorithms, genetic programming, regression,
symbolic regression: Poster",
-
isbn13 = "9798400701191",
-
DOI = "doi:10.1145/3583133.3590525",
-
size = "4 pages",
-
abstract = "Underspecification happens when there are different
plausible hypotheses for a training and validation data
set that behave differently when evaluating outside the
training domain or distribution. Symbolic regression
algorithms are prone to underspecification because of
the additional degree of freedom of having to specify
the structural component of the regression model. When
facing different likely alternatives, some algorithms
use the Occam's razor principle of choosing the
simplest alternative. But not only there is no
guarantee that this is the correct decision but the
definition of simplest in symbolic regression is also
subjective. In this work we analyse the use diversity
control mechanisms to help fight the underspecification
problem by providing to the end-user multiple
alternative models in a single execution. These
alternative models can be used in a post-analysis
process when the practitioner has additional knowledge.
For this purpose, we implemented a fitness sharing
mechanism in the Transformation-Interaction-Rational
Symbolic Regression algorithm with a distance function
that measures how different two models behave outside
the domain of the training data. The results showed
that this adaptation is capable of producing multiple
alternatives with similar fitness but with distinct
behavior outside this domain.",
-
notes = "GECCO-2023 A Recombination of the 32nd International
Conference on Genetic Algorithms (ICGA) and the 28th
Annual Genetic Programming Conference (GP)",
- }
Genetic Programming entries for
Fabricio Olivetti de Franca
Citations