On the challenges of studying bias in Recommender Systems: The effect of data characteristics and algorithm configuration. Daniil, S., Slokom, M., Cuper, M., Liem, C., Ossenbruggen, J. v., & Hollink, L. Information Retrieval Research, 1(1):3–27, February, 2025. Number: 1
Paper doi abstract bibtex Statements on the propagation of bias by recommender systems are often hard to verify or falsify. Research on bias tends to draw from a small pool of publicly available datasets and is therefore bound by their specific properties. Additionally, implementation choices are often not explicitly described or motivated in research, while they may have an effect on bias propagation. In this paper, we explore the challenges of measuring and reporting popularity bias. We showcase the impact of data properties and algorithm configurations on popularity bias by combining real and synthetic data with well known recommender systems frameworks. First, we identify data characteristics that might impact popularity bias, and explore their presence in a set of available online datasets. Accordingly, we generate various datasets that combine these characteristics. Second, we locate algorithm configurations that vary across implementations in literature. We evaluate popularity bias for a number of datasets, three real and five synthetic, and configurations, and offer insights on their joint effect. We find that, depending on the data characteristics, various configurations of the algorithms examined can lead to different conclusions regarding the propagation of popularity bias. These results motivate the need for explicitly addressing algorithmic configuration and data properties when reporting and interpreting bias in recommender systems.
@comment{
  Journal article. Author names use the "von Last, First" form; the particle
  "van" is written before the surname so that BibTeX parses it as
  First=Jacco, von=van, Last=Ossenbruggen. The issue number is stored in the
  "number" field only.
}
@article{daniil_challenges_2025,
  author     = {Daniil, Savvina and Slokom, Manel and Cuper, Mirjam and Liem, Cynthia and van Ossenbruggen, Jacco and Hollink, Laura},
  title      = {On the challenges of studying bias in {Recommender} {Systems}: {The} effect of data characteristics and algorithm configuration},
  shorttitle = {On the challenges of studying bias in {Recommender} {Systems}},
  journal    = {Information Retrieval Research},
  volume     = {1},
  number     = {1},
  pages      = {3--27},
  month      = feb,
  year       = {2025},
  issn       = {3050-9114},
  doi        = {10.54195/irrj.19607},
  url        = {https://irrj.org/article/view/19607},
  urldate    = {2025-04-15},
  language   = {en},
  copyright  = {Copyright (c) 2025 Savvina Daniil, Manel Slokom, Mirjam Cuper, Cynthia Liem, Jacco van Ossenbruggen, Laura Hollink (Author)},
  abstract   = {Statements on the propagation of bias by recommender systems are often hard to verify or falsify. Research on bias tends to draw from a small pool of publicly available datasets and is therefore bound by their specific properties. Additionally, implementation choices are often not explicitly described or motivated in research, while they may have an effect on bias propagation. In this paper, we explore the challenges of measuring and reporting popularity bias. We showcase the impact of data properties and algorithm configurations on popularity bias by combining real and synthetic data with well known recommender systems frameworks. First, we identify data characteristics that might impact popularity bias, and explore their presence in a set of available online datasets. Accordingly, we generate various datasets that combine these characteristics. Second, we locate algorithm configurations that vary across implementations in literature. We evaluate popularity bias for a number of datasets, three real and five synthetic, and configurations, and offer insights on their joint effect. We find that, depending on the data characteristics, various configurations of the algorithms examined can lead to different conclusions regarding the propagation of popularity bias. These results motivate the need for explicitly addressing algorithmic configuration and data properties when reporting and interpreting bias in recommender systems.},
}
Downloads: 0
{"_id":"p5e4KQyEBcgTWBZYH","bibbaseid":"daniil-slokom-cuper-liem-ossenbruggen-hollink-onthechallengesofstudyingbiasinrecommendersystemstheeffectofdatacharacteristicsandalgorithmconfiguration-2025","author_short":["Daniil, S.","Slokom, M.","Cuper, M.","Liem, C.","Ossenbruggen, J. v.","Hollink, L."],"bibdata":{"bibtype":"article","type":"article","title":"On the challenges of studying bias in Recommender Systems: The effect of data characteristics and algorithm configuration","volume":"1","copyright":"Copyright (c) 2025 Savvina Daniil, Manel Slokom, Mirjam Cuper, Cynthia Liem, Jacco van Ossenbruggen, Laura Hollink (Author)","issn":"3050-9114","shorttitle":"On the challenges of studying bias in Recommender Systems","url":"https://irrj.org/article/view/19607","doi":"10.54195/irrj.19607","abstract":"Statements on the propagation of bias by recommender systems are often hard to verify or falsify. Research on bias tends to draw from a small pool of publicly available datasets and is therefore bound by their specific properties. Additionally, implementation choices are often not explicitly described or motivated in research, while they may have an effect on bias propagation. In this paper, we explore the challenges of measuring and reporting popularity bias. We showcase the impact of data properties and algorithm configurations on popularity bias by combining real and synthetic data with well known recommender systems frameworks. First, we identify data characteristics that might impact popularity bias, and explore their presence in a set of available online datasets. Accordingly, we generate various datasets that combine these characteristics. Second, we locate algorithm configurations that vary across implementations in literature. We evaluate popularity bias for a number of datasets, three real and five synthetic, and configurations, and offer insights on their joint effect. 
We find that, depending on the data characteristics, various configurations of the algorithms examined can lead to different conclusions regarding the propagation of popularity bias. These results motivate the need for explicitly addressing algorithmic configuration and data properties when reporting and interpreting bias in recommender systems.","language":"en","number":"1","urldate":"2025-04-15","journal":"Information Retrieval Research","author":[{"propositions":[],"lastnames":["Daniil"],"firstnames":["Savvina"],"suffixes":[]},{"propositions":[],"lastnames":["Slokom"],"firstnames":["Manel"],"suffixes":[]},{"propositions":[],"lastnames":["Cuper"],"firstnames":["Mirjam"],"suffixes":[]},{"propositions":[],"lastnames":["Liem"],"firstnames":["Cynthia"],"suffixes":[]},{"propositions":[],"lastnames":["Ossenbruggen"],"firstnames":["Jacco","van"],"suffixes":[]},{"propositions":[],"lastnames":["Hollink"],"firstnames":["Laura"],"suffixes":[]}],"month":"February","year":"2025","note":"Number: 1","pages":"3–27","bibtex":"@article{daniil_challenges_2025,\n\ttitle = {On the challenges of studying bias in {Recommender} {Systems}: {The} effect of data characteristics and algorithm configuration},\n\tvolume = {1},\n\tcopyright = {Copyright (c) 2025 Savvina Daniil, Manel Slokom, Mirjam Cuper, Cynthia Liem, Jacco van Ossenbruggen, Laura Hollink (Author)},\n\tissn = {3050-9114},\n\tshorttitle = {On the challenges of studying bias in {Recommender} {Systems}},\n\turl = {https://irrj.org/article/view/19607},\n\tdoi = {10.54195/irrj.19607},\n\tabstract = {Statements on the propagation of bias by recommender systems are often hard to verify or falsify. Research on bias tends to draw from a small pool of publicly available datasets and is therefore bound by their specific properties. Additionally, implementation choices are often not explicitly described or motivated in research, while they may have an effect on bias propagation. 
In this paper, we explore the challenges of measuring and reporting popularity bias. We showcase the impact of data properties and algorithm configurations on popularity bias by combining real and synthetic data with well known recommender systems frameworks. First, we identify data characteristics that might impact popularity bias, and explore their presence in a set of available online datasets. Accordingly, we generate various datasets that combine these characteristics. Second, we locate algorithm configurations that vary across implementations in literature. We evaluate popularity bias for a number of datasets, three real and five synthetic, and configurations, and offer insights on their joint effect. We find that, depending on the data characteristics, various configurations of the algorithms examined can lead to different conclusions regarding the propagation of popularity bias. These results motivate the need for explicitly addressing algorithmic configuration and data properties when reporting and interpreting bias in recommender systems.},\n\tlanguage = {en},\n\tnumber = {1},\n\turldate = {2025-04-15},\n\tjournal = {Information Retrieval Research},\n\tauthor = {Daniil, Savvina and Slokom, Manel and Cuper, Mirjam and Liem, Cynthia and Ossenbruggen, Jacco van and Hollink, Laura},\n\tmonth = feb,\n\tyear = {2025},\n\tnote = {Number: 1},\n\tpages = {3--27},\n}\n\n","author_short":["Daniil, S.","Slokom, M.","Cuper, M.","Liem, C.","Ossenbruggen, J. 
v.","Hollink, L."],"key":"daniil_challenges_2025","id":"daniil_challenges_2025","bibbaseid":"daniil-slokom-cuper-liem-ossenbruggen-hollink-onthechallengesofstudyingbiasinrecommendersystemstheeffectofdatacharacteristicsandalgorithmconfiguration-2025","role":"author","urls":{"Paper":"https://irrj.org/article/view/19607"},"metadata":{"authorlinks":{}}},"bibtype":"article","biburl":"https://api.zotero.org/users/6655/collections/3TB3KT36/items?key=VFvZhZXIoHNBbzoLZ1IM2zgf&format=bibtex&limit=100","dataSources":["7KNAjxiv2tsagmbgY"],"keywords":[],"search_terms":["challenges","studying","bias","recommender","systems","effect","data","characteristics","algorithm","configuration","daniil","slokom","cuper","liem","ossenbruggen","hollink"],"title":"On the challenges of studying bias in Recommender Systems: The effect of data characteristics and algorithm configuration","year":2025}