SchemaTree: Maximum-Likelihood Property Recommendation for Wikidata. Gleim, L. C., Schimassek, R., Hüser, D., Peters, M., Krämer, C., Cochez, M., & Decker, S. In Harth, A., Kirrane, S., Ngonga Ngomo, A., Paulheim, H., Rula, A., Gentile, A. L., Haase, P., & Cochez, M., editors, The Semantic Web, pages 179–195, Cham, 2020. Springer International Publishing. abstract bibtex Wikidata is a free and open knowledge base which can be read and edited by both humans and machines. It acts as a central storage for the structured data of several Wikimedia projects. To improve the process of manually inserting new facts, the Wikidata platform features an association rule-based tool to recommend additional suitable properties. In this work, we introduce a novel approach to provide such recommendations based on frequentist inference. We introduce a trie-based method that can efficiently learn and represent property set probabilities in RDF graphs. We extend the method by adding type information to improve recommendation precision and introduce backoff strategies which further increase the performance of the initial approach for entities with rare property combinations. We investigate how the captured structure can be employed for property recommendation, analogously to the Wikidata PropertySuggester. We evaluate our approach on the full Wikidata dataset and compare its performance to the state-of-the-art Wikidata PropertySuggester, outperforming it in all evaluated metrics. Notably we could reduce the average rank of the first relevant recommendation by 71%.
@InProceedings{gleim2020schematree,
author="Gleim, Lars C.
and Schimassek, Rafael
and H{\"u}ser, Dominik
and Peters, Maximilian
and Kr{\"a}mer, Christoph
and Cochez, Michael
and Decker, Stefan",
editor="Harth, Andreas
and Kirrane, Sabrina
and Ngonga Ngomo, Axel-Cyrille
and Paulheim, Heiko
and Rula, Anisa
and Gentile, Anna Lisa
and Haase, Peter
and Cochez, Michael",
title="SchemaTree: Maximum-Likelihood Property Recommendation for {Wikidata}",
booktitle="The Semantic Web",
year="2020",
publisher="Springer International Publishing",
address="Cham",
pages="179--195",
abstract="Wikidata is a free and open knowledge base which can be read and edited by both humans and machines. It acts as a central storage for the structured data of several Wikimedia projects. To improve the process of manually inserting new facts, the Wikidata platform features an association rule-based tool to recommend additional suitable properties. In this work, we introduce a novel approach to provide such recommendations based on frequentist inference. We introduce a trie-based method that can efficiently learn and represent property set probabilities in RDF graphs. We extend the method by adding type information to improve recommendation precision and introduce backoff strategies which further increase the performance of the initial approach for entities with rare property combinations. We investigate how the captured structure can be employed for property recommendation, analogously to the Wikidata PropertySuggester. We evaluate our approach on the full Wikidata dataset and compare its performance to the state-of-the-art Wikidata PropertySuggester, outperforming it in all evaluated metrics. Notably we could reduce the average rank of the first relevant recommendation by 71{\%}.",
isbn="978-3-030-49461-2"
}
Downloads: 0
{"_id":"nQ32XZBLyLSv5YCM5","bibbaseid":"gleim-schimassek-hser-peters-krmer-cochez-decker-schematreemaximumlikelihoodpropertyrecommendationforwikidata-2020","author_short":["Gleim, L. C.","Schimassek, R.","Hüser, D.","Peters, M.","Krämer, C.","Cochez, M.","Decker, S."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","author":[{"propositions":[],"lastnames":["Gleim"],"firstnames":["Lars","C."],"suffixes":[]},{"propositions":[],"lastnames":["Schimassek"],"firstnames":["Rafael"],"suffixes":[]},{"propositions":[],"lastnames":["Hüser"],"firstnames":["Dominik"],"suffixes":[]},{"propositions":[],"lastnames":["Peters"],"firstnames":["Maximilian"],"suffixes":[]},{"propositions":[],"lastnames":["Krämer"],"firstnames":["Christoph"],"suffixes":[]},{"propositions":[],"lastnames":["Cochez"],"firstnames":["Michael"],"suffixes":[]},{"propositions":[],"lastnames":["Decker"],"firstnames":["Stefan"],"suffixes":[]}],"editor":[{"propositions":[],"lastnames":["Harth"],"firstnames":["Andreas"],"suffixes":[]},{"propositions":[],"lastnames":["Kirrane"],"firstnames":["Sabrina"],"suffixes":[]},{"propositions":[],"lastnames":["Ngonga","Ngomo"],"firstnames":["Axel-Cyrille"],"suffixes":[]},{"propositions":[],"lastnames":["Paulheim"],"firstnames":["Heiko"],"suffixes":[]},{"propositions":[],"lastnames":["Rula"],"firstnames":["Anisa"],"suffixes":[]},{"propositions":[],"lastnames":["Gentile"],"firstnames":["Anna","Lisa"],"suffixes":[]},{"propositions":[],"lastnames":["Haase"],"firstnames":["Peter"],"suffixes":[]},{"propositions":[],"lastnames":["Cochez"],"firstnames":["Michael"],"suffixes":[]}],"title":"SchemaTree: Maximum-Likelihood Property Recommendation for Wikidata","booktitle":"The Semantic Web","year":"2020","publisher":"Springer International Publishing","address":"Cham","pages":"179–195","abstract":"Wikidata is a free and open knowledge base which can be read and edited by both humans and machines. It acts as a central storage for the structured data of several Wikimedia projects. To improve the process of manually inserting new facts, the Wikidata platform features an association rule-based tool to recommend additional suitable properties. In this work, we introduce a novel approach to provide such recommendations based on frequentist inference. We introduce a trie-based method that can efficiently learn and represent property set probabilities in RDF graphs. We extend the method by adding type information to improve recommendation precision and introduce backoff strategies which further increase the performance of the initial approach for entities with rare property combinations. We investigate how the captured structure can be employed for property recommendation, analogously to the Wikidata PropertySuggester. We evaluate our approach on the full Wikidata dataset and compare its performance to the state-of-the-art Wikidata PropertySuggester, outperforming it in all evaluated metrics. Notably we could reduce the average rank of the first relevant recommendation by 71%.","isbn":"978-3-030-49461-2","bibtex":"@InProceedings{gleim2020schematree,\n\tauthor=\"Gleim, Lars C.\n\tand Schimassek, Rafael\n\tand H{\\\"u}ser, Dominik\n\tand Peters, Maximilian\n\tand Kr{\\\"a}mer, Christoph\n\tand Cochez, Michael\n\tand Decker, Stefan\",\n\teditor=\"Harth, Andreas\n\tand Kirrane, Sabrina\n\tand Ngonga Ngomo, Axel-Cyrille\n\tand Paulheim, Heiko\n\tand Rula, Anisa\n\tand Gentile, Anna Lisa\n\tand Haase, Peter\n\tand Cochez, Michael\",\n\ttitle=\"SchemaTree: Maximum-Likelihood Property Recommendation for {Wikidata}\",\n\tbooktitle=\"The Semantic Web\",\n\tyear=\"2020\",\n\tpublisher=\"Springer International Publishing\",\n\taddress=\"Cham\",\n\tpages=\"179--195\",\n\tabstract=\"Wikidata is a free and open knowledge base which can be read and edited by both humans and machines. It acts as a central storage for the structured data of several Wikimedia projects. To improve the process of manually inserting new facts, the Wikidata platform features an association rule-based tool to recommend additional suitable properties. In this work, we introduce a novel approach to provide such recommendations based on frequentist inference. We introduce a trie-based method that can efficiently learn and represent property set probabilities in RDF graphs. We extend the method by adding type information to improve recommendation precision and introduce backoff strategies which further increase the performance of the initial approach for entities with rare property combinations. We investigate how the captured structure can be employed for property recommendation, analogously to the Wikidata PropertySuggester. We evaluate our approach on the full Wikidata dataset and compare its performance to the state-of-the-art Wikidata PropertySuggester, outperforming it in all evaluated metrics. Notably we could reduce the average rank of the first relevant recommendation by 71{\\%}.\",\n\tisbn=\"978-3-030-49461-2\"\n}\n\n","author_short":["Gleim, L. C.","Schimassek, R.","Hüser, D.","Peters, M.","Krämer, C.","Cochez, M.","Decker, S."],"editor_short":["Harth, A.","Kirrane, S.","Ngonga Ngomo, A.","Paulheim, H.","Rula, A.","Gentile, A. L.","Haase, P.","Cochez, M."],"key":"gleim2020schematree","id":"gleim2020schematree","bibbaseid":"gleim-schimassek-hser-peters-krmer-cochez-decker-schematreemaximumlikelihoodpropertyrecommendationforwikidata-2020","role":"author","urls":{},"metadata":{"authorlinks":{}}},"bibtype":"inproceedings","biburl":"https://raw.githubusercontent.com/KRRVU/website/master/publications/krr.bib","dataSources":["H6xuGqu5uQ6rXhdJ4","jRiMQcLQ4TWHSS6Mc","dJmTXpbSWWjnxatYT","KenkBKiHAK4JSijXa"],"keywords":[],"search_terms":["schematree","maximum","likelihood","property","recommendation","wikidata","gleim","schimassek","hüser","peters","krämer","cochez","decker"],"title":"SchemaTree: Maximum-Likelihood Property Recommendation for Wikidata","year":2020}