A PAC-Bayesian Link Between Generalisation and Flat Minima. Haddouche, M., Viallard, P., Şimşekli, U., & Guedj, B. 2024. Submitted.Paper Pdf doi abstract bibtex 11 downloads Modern machine learning usually involves predictors in the overparametrised setting (number of trained parameters greater than dataset size), and their training yield not only good performances on training data, but also good generalisation capacity. This phenomenon challenges many theoretical results, and remains an open problem. To reach a better understanding, we provide novel generalisation bounds involving gradient terms. To do so, we combine the PAC-Bayes toolbox with Poincaré and Log-Sobolev inequalities, avoiding an explicit dependency on dimension of the predictor space. Our results highlight the positive influence of \emphflat minima (being minima with a neighbourhood nearly minimising the learning problem as well) on generalisation performances, involving directly the benefits of the optimisation phase.
@unpublished{haddouche2024pls,
title = {A PAC-Bayesian Link Between Generalisation and Flat Minima},
author = {Haddouche, Maxime and Viallard, Paul and Şimşekli, Umut and Guedj, Benjamin},
year = {2024},
note = "Submitted.",
abstract = {Modern machine learning usually involves predictors in the overparametrised setting (number of trained parameters greater than dataset size), and their training yield not only good performances on training data, but also good generalisation capacity. This phenomenon challenges many theoretical results, and remains an open problem. To reach a better understanding, we provide novel generalisation bounds involving gradient terms. To do so, we combine the PAC-Bayes toolbox with Poincaré and Log-Sobolev inequalities, avoiding an explicit dependency on dimension of the predictor space. Our results highlight the positive influence of \emph{flat minima} (being minima with a neighbourhood nearly minimising the learning problem as well) on generalisation performances, involving directly the benefits of the optimisation phase. },
url = {https://arxiv.org/abs/2402.08508},
url_PDF = {https://arxiv.org/pdf/2402.08508.pdf},
doi = {10.48550/ARXIV.2402.08508},
eprint={2402.08508},
archivePrefix={arXiv},
primaryClass={stat.ML},
copyright = {Creative Commons Attribution 4.0 International},
keywords={mine}
}
Downloads: 11
{"_id":"vmSiHMMQuPeXzW9KZ","bibbaseid":"haddouche-viallard-imekli-guedj-apacbayesianlinkbetweengeneralisationandflatminima-2024","author_short":["Haddouche, M.","Viallard, P.","Şimşekli, U.","Guedj, B."],"bibdata":{"bibtype":"unpublished","type":"unpublished","title":"A PAC-Bayesian Link Between Generalisation and Flat Minima","author":[{"propositions":[],"lastnames":["Haddouche"],"firstnames":["Maxime"],"suffixes":[]},{"propositions":[],"lastnames":["Viallard"],"firstnames":["Paul"],"suffixes":[]},{"propositions":[],"lastnames":["Şimşekli"],"firstnames":["Umut"],"suffixes":[]},{"propositions":[],"lastnames":["Guedj"],"firstnames":["Benjamin"],"suffixes":[]}],"year":"2024","note":"Submitted.","abstract":"Modern machine learning usually involves predictors in the overparametrised setting (number of trained parameters greater than dataset size), and their training yield not only good performances on training data, but also good generalisation capacity. This phenomenon challenges many theoretical results, and remains an open problem. To reach a better understanding, we provide novel generalisation bounds involving gradient terms. To do so, we combine the PAC-Bayes toolbox with Poincaré and Log-Sobolev inequalities, avoiding an explicit dependency on dimension of the predictor space. Our results highlight the positive influence of \\emphflat minima (being minima with a neighbourhood nearly minimising the learning problem as well) on generalisation performances, involving directly the benefits of the optimisation phase. ","url":"https://arxiv.org/abs/2402.08508","url_pdf":"https://arxiv.org/pdf/2402.08508.pdf","doi":"10.48550/ARXIV.2402.08508","eprint":"2402.08508","archiveprefix":"arXiv","primaryclass":"stat.ML","copyright":"Creative Commons Attribution 4.0 International","keywords":"mine","bibtex":"@unpublished{haddouche2024pls,\ntitle = {A PAC-Bayesian Link Between Generalisation and Flat Minima},\nauthor = {Haddouche, Maxime and Viallard, Paul and Şimşekli, Umut and Guedj, Benjamin},\nyear = {2024},\nnote = \"Submitted.\",\nabstract = {Modern machine learning usually involves predictors in the overparametrised setting (number of trained parameters greater than dataset size), and their training yield not only good performances on training data, but also good generalisation capacity. This phenomenon challenges many theoretical results, and remains an open problem. To reach a better understanding, we provide novel generalisation bounds involving gradient terms. To do so, we combine the PAC-Bayes toolbox with Poincaré and Log-Sobolev inequalities, avoiding an explicit dependency on dimension of the predictor space. Our results highlight the positive influence of \\emph{flat minima} (being minima with a neighbourhood nearly minimising the learning problem as well) on generalisation performances, involving directly the benefits of the optimisation phase. },\nurl = {https://arxiv.org/abs/2402.08508},\nurl_PDF = {https://arxiv.org/pdf/2402.08508.pdf},\ndoi = {10.48550/ARXIV.2402.08508},\neprint={2402.08508},\narchivePrefix={arXiv},\nprimaryClass={stat.ML},\ncopyright = {Creative Commons Attribution 4.0 International},\nkeywords={mine}\n}\n\n","author_short":["Haddouche, M.","Viallard, P.","Şimşekli, U.","Guedj, B."],"key":"haddouche2024pls","id":"haddouche2024pls","bibbaseid":"haddouche-viallard-imekli-guedj-apacbayesianlinkbetweengeneralisationandflatminima-2024","role":"author","urls":{"Paper":"https://arxiv.org/abs/2402.08508"," pdf":"https://arxiv.org/pdf/2402.08508.pdf"},"keyword":["mine"],"metadata":{"authorlinks":{}},"downloads":11,"html":""},"bibtype":"unpublished","biburl":"https://bguedj.github.io/files/bguedj-publications.bib","dataSources":["suE7RgYeZEnSYr5Fy"],"keywords":["mine"],"search_terms":["pac","bayesian","link","between","generalisation","flat","minima","haddouche","viallard","şimşekli","guedj"],"title":"A PAC-Bayesian Link Between Generalisation and Flat Minima","year":2024,"downloads":11}