A Kernel Perspective for Regularizing Deep Neural Networks. Bietti, A., Mialon, G., Chen, D., & Mairal, J. Technical Report arXiv:1810.00363, arXiv, May, 2019. arXiv:1810.00363 [cs, stat] type: article
A Kernel Perspective for Regularizing Deep Neural Networks [link]Paper  doi  abstract   bibtex   
We propose a new point of view for regularizing deep neural networks by using the norm of a reproducing kernel Hilbert space (RKHS). Even though this norm cannot be computed, it admits upper and lower approximations leading to various practical strategies. Specifically, this perspective (i) provides a common umbrella for many existing regularization principles, including spectral norm and gradient penalties, or adversarial training, (ii) leads to new effective regularization penalties, and (iii) suggests hybrid strategies combining lower and upper bounds to get better approximations of the RKHS norm. We experimentally show this approach to be effective when learning on small datasets, or to obtain adversarially robust models.
@techreport{bietti_kernel_2019,
	title = {A {Kernel} {Perspective} for {Regularizing} {Deep} {Neural} {Networks}},
	url = {http://arxiv.org/abs/1810.00363},
	abstract = {We propose a new point of view for regularizing deep neural networks by using the norm of a reproducing kernel Hilbert space (RKHS). Even though this norm cannot be computed, it admits upper and lower approximations leading to various practical strategies. Specifically, this perspective (i) provides a common umbrella for many existing regularization principles, including spectral norm and gradient penalties, or adversarial training, (ii) leads to new effective regularization penalties, and (iii) suggests hybrid strategies combining lower and upper bounds to get better approximations of the RKHS norm. We experimentally show this approach to be effective when learning on small datasets, or to obtain adversarially robust models.},
	number = {arXiv:1810.00363},
	urldate = {2022-05-23},
	institution = {arXiv},
	author = {Bietti, Alberto and Mialon, Grégoire and Chen, Dexiong and Mairal, Julien},
	month = may,
	year = {2019},
	doi = {10.48550/arXiv.1810.00363},
	note = {arXiv:1810.00363 [cs, stat]
type: article},
	keywords = {Computer Science - Machine Learning, Statistics - Machine Learning},
}

Downloads: 0