Optimal Baseline Corrections for Off-Policy Contextual Bandits. Gupta, S., Jeunen, O., Oosterhuis, H., & de Rijke, M. In RecSys 2024: 18th ACM Conference on Recommender Systems, October, 2024. ACM.
bibtex   
% RecSys 2024 conference paper. `month` uses the predefined BibTeX macro (unbraced)
% so that the bibliography style decides how the month is abbreviated/localized.
@inproceedings{gupta-2024-optimal,
	author = {Gupta, Shashank and Jeunen, Olivier and Oosterhuis, Harrie and de Rijke, Maarten},
	title = {Optimal Baseline Corrections for Off-Policy Contextual Bandits},
	booktitle = {RecSys 2024: 18th ACM Conference on Recommender Systems},
	publisher = {ACM},
	month = oct,
	year = {2024},
	date-added = {2024-09-30 11:16:40 +0200},
	date-modified = {2024-09-30 11:16:40 +0200},
}

Downloads: 0