Improving experimental methods on success rates in evolutionary computation. Barrero, D., R-Moreno, M., & Camacho, D. Journal of Experimental and Theoretical Artificial Intelligence, 2017.
abstract   bibtex   
© 2016 Informa UK Limited, trading as Taylor & Francis Group. Due to the complexity of theoretical approaches in evolutionary computation (EC), research has been largely performed on an experimental basis. One popular measure used by the EC community is the success rate (SR), which is used alone or as part of more complex measures such as Koza’s computational effort in genetic programming. A common practice in EC is to report just a punctual estimation of the SR, without additional information about its associated uncertainty. We aim to motivate EC researchers to adopt more rigorous practices when working with SRs. In particular, we introduce the importance of correctly reporting this measure and highlight its binomial nature. Unfortunately, this fact is usually overlooked in the literature. Considering the binomiality of the SR opens the whole corpus of binomial statistics to EA research and practice. In particular, we focus on studying several methods to compute SR confidence intervals, the factors that determine their quality in terms of coverage probability and interval length. Due to its practical interest, we also briefly discuss the number of required runs to build confidence intervals with a certain quality, providing a sound method to set the number of runs, one of the most important experimental settings in EC. Evidence suggests that Wilson is, on average, a reliable and simple method to bound an estimation of SR with confidence intervals, while the standard method, which is quite popular because of its conceptual simplicity, should be avoided in any case. However, other methods can also be of interest under certain circumstances. We encourage researchers to report the number of trials and successes, as well as the interval, to ease further comparability of the results.
@comment{Journal article on reporting success rates in evolutionary computation.
  Bibliographic fields come first; the trailing fields (id, created, profile_id,
  read, starred, ...) are reference-manager bookkeeping that bibliography styles
  ignore. No page range or DOI was present in the export this entry came from.}
@article{barrero2017improving,
  author              = {Barrero, D. F. and R-Moreno, M. D. and Camacho, D.},
  title               = {Improving experimental methods on success rates in evolutionary computation},
  journal             = {Journal of Experimental and Theoretical Artificial Intelligence},
  year                = {2017},
  volume              = {29},
  number              = {4},
  keywords            = {Experimentation,confidence intervals,evolutionary computation,genetic programming,performance measures,success rate},
  abstract            = {© 2016 Informa UK Limited, trading as Taylor \& Francis Group. Due to the complexity of theoretical approaches in evolutionary computation (EC), research has being largely performed on experimental basis. One popular measure used by the EC community is the success rate (SR), which is used alone or as part of more complex measures such as Koza’s computational effort in genetic programming. A common practice in EC is to report just a punctual estimation of the SR, without additional information about its associated uncertainty. We aim to motivate EC researchers to adopt more rigorous practices when working with SRs. In particular, we introduce the importance of correctly reporting this measure and highlight its binomial nature. Unfortunately, this fact is usually overlooked in the literature. Considering the binomiality of the SR opens the whole corpus of binomial statistics to EA research and practice. In particular, we focus on studying several methods to compute SR confidence intervals, the factors that determine their quality in terms of coverage probability and interval length. Due to its practical interest, we also briefly discuss the number of required runs to build confidence intervals with a certain quality, providing a sound method to set the number of runs, one of the most important experimental settings in EC. Evidence suggests that Wilson is, on average, a reliable and simple method to bound an estimation of SR with confidence intervals, while the standard method, which is quite popular because of its conceptual simplicity, should be avoided in any case. However, other methods can also be of interest under certain circumstances. We encourage to report the number of trials and successes, as well as the interval, to ease further comparability of the results.},
  type                = {article},
  bibtype             = {article},
  id                  = {1e847b19-9abf-3730-aa97-ac4c44c4b290},
  created             = {2019-03-18T15:00:28.553Z},
  last_modified       = {2019-03-18T15:00:28.553Z},
  profile_id          = {77ead516-4fb7-3189-a920-09efa515b9dd},
  file_attached       = {false},
  read                = {false},
  starred             = {false},
  authored            = {true},
  confirmed           = {false},
  hidden              = {false},
  private_publication = {false},
}

Downloads: 0