Comparative study of classifier performance using automatic feature construction by M3GP
Created by W.Langdon from
gp-bibliography.bib Revision:1.8051
- @InProceedings{Batista:2022:CEC,
-
author = "Joao E. Batista and Sara Silva",
-
title = "Comparative study of classifier performance using
automatic feature construction by {M3GP}",
-
booktitle = "2022 IEEE Congress on Evolutionary Computation (CEC)",
-
year = "2022",
-
editor = "Carlos A. Coello Coello and Sanaz Mostaghim",
-
address = "Padua, Italy",
-
month = "18-23 " # jul,
-
keywords = "genetic algorithms, genetic programming, M3GP, Python,
naive Bayes, decision trees, Support vector machines,
random forests, xgboost, Machine learning algorithms,
Computational modeling, Evolutionary computation,
Classification algorithms, Complexity theory, Feature
Construction, Multiclass Classification",
-
isbn13 = "978-1-6654-6708-7",
-
DOI = "doi:10.1109/CEC55065.2022.9870343",
-
code_url = "http://github.com/jespb/Python-M3GP",
-
size = "8 pages",
-
abstract = "The M3GP algorithm, originally designed to perform
multiclass classification with genetic programming, is
also a powerful feature construction method. Here we
explore its ability to evolve hyper-features that are
tailored not only to the problem to be solved, but also
to the learning algorithm that is used to solve it. We
pair M3GP with six different machine learning
algorithms and study its performance in eight
classification problems from different scientific
domains, with substantial variety in the number of
classes, features and samples. The results show that
automatic feature construction with M3GP, when compared
to using the standalone classifiers without feature
construction, achieves statistically significant
improvements in the majority of the test cases,
sometimes by a very large margin, while degrading the
weighted f-measure in only one out of 48 cases. We
observe the differences in the number and size of the
hyper-features evolved for each case, hypothesising
that the simpler the classifier, the larger the amount
of problem complexity is being captured in the
hyperfeatures. Our results also reveal that the M3GP
algorithm can be improved, both in execution time and
in model quality, by replacing its default classifier
with support vector machines or random forest
classifiers.",
-
notes = "Also known as \cite{9870343}",
- }
Genetic Programming entries for
Joao E Batista
Sara Silva
Citations