Analyzing and Accessing Wikipedia as a Lexical Semantic Resource

Analyzing and Accessing Wikipedia as a Lexical Semantic Resource. Zesch, T., Gurevych, I., & Mühlhäuser, M. Data Structures for Linguistic Resources and Applications, Gunter Narr, Tübingen, 2007.

Website | Abstract | BibTeX

We analyze Wikipedia as a lexical semantic resource and compare it with conventional resources, such as dictionaries, thesauri, semantic wordnets, etc. Different parts of Wikipedia reflect different aspects of these resources. We show that Wikipedia contains a vast amount of knowledge about, e.g., named entities, domain specific terms, and rare word senses. If Wikipedia is to be used as a lexical semantic resource in large-scale NLP tasks, efficient programmatic access to the knowledge therein is required. We review existing access mechanisms and show that they are limited with respect to performance and the provided access functions. Therefore, we introduce a general purpose, high performance Java-based Wikipedia API that overcomes these limitations. It is available for research purposes at http://www.ukp.tu-darmstadt.de/software/WikipediaAPI.

@article{Zesch2007,
 title = {Analyzing and Accessing {Wikipedia} as a Lexical Semantic Resource},
 type = {article},
 year = {2007},
 pages = {197--205},
 url = {http://elara.tk.informatik.tu-darmstadt.de/Publications/2007/gldv07_10p.pdf},
 websites = {http://elara.tk.informatik.tu-darmstadt.de/Publications/2007/gldv07_10p.pdf},
 publisher = {Gunter Narr},
 address = {Tübingen},
 institution = {Ubiquitous Knowledge Processing Group, Darmstadt University of Technology},
 review_note = {NOTE(review): (1) The exported editors field contained only the placeholder text [object Object] three times and was dropped; restore the real editor names in an editor field from the publisher record. (2) The number value March 2001 does not look like an issue number and conflicts with year 2007; verify against the source. (3) The venue has a book publisher, a page range, and no volume, so this is presumably a chapter in an edited volume; confirm, then consider incollection with booktitle instead of article with journal.},
 id = {601d6f3a-48ef-3a44-ba9f-c889f85b908a},
 created = {2012-02-09T21:39:35.000Z},
 file_attached = {false},
 profile_id = {5284e6aa-156c-3ce5-bc0e-b80cf09f3ef6},
 group_id = {066b42c8-f712-3fc3-abb2-225c158d2704},
 last_modified = {2017-03-14T14:36:19.698Z},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {Zesch2007},
 private_publication = {false},
 abstract = {We analyze Wikipedia as a lexical semantic resource and compare it with conventional resources, such as dictionaries, thesauri, semantic wordnets, etc. Different parts of Wikipedia reflect different aspects of these resources. We show that Wikipedia contains a vast amount of knowledge about, e.g., named entities, domain specific terms, and rare word senses. If Wikipedia is to be used as a lexical semantic resource in large-scale NLP tasks, efficient programmatic access to the knowledge therein is required. We review existing access mechanisms and show that they are limited with respect to performance and the provided access functions. Therefore, we introduce a general purpose, high performance Java-based Wikipedia API that overcomes these limitations. It is available for research purposes at http://www.ukp.tu-darmstadt.de/software/WikipediaAPI.},
 bibtype = {article},
 author = {Zesch, Torsten and Gurevych, Iryna and Mühlhäuser, Max},
 journal = {Data Structures for Linguistic Resources and Applications},
 number = {March 2001}
}

Downloads: 0

{"_id":"FqZaPmupZfkyo2jKs","bibbaseid":"zesch-gurevych-mhlhuser-analyzingandaccessingwikipediaasalexicalsemanticresource-2007","authorIDs":[],"author_short":["Zesch, T.","Gurevych, I.","Mühlhäuser, M."],"bibdata":{"title":"Analyzing and Accessing Wikipedia as a Lexical Semantic Resource","type":"article","year":"2007","pages":"197-205","websites":"http://elara.tk.informatik.tu-darmstadt.de/Publications/2007/gldv07_10p.pdf","publisher":"Gunter Narr, Tübingen","institution":"Ubiquitous Knowledge Processing Group, Darmstadt University of Technology","editors":"[object Object],[object Object],[object Object]","id":"601d6f3a-48ef-3a44-ba9f-c889f85b908a","created":"2012-02-09T21:39:35.000Z","file_attached":false,"profile_id":"5284e6aa-156c-3ce5-bc0e-b80cf09f3ef6","group_id":"066b42c8-f712-3fc3-abb2-225c158d2704","last_modified":"2017-03-14T14:36:19.698Z","read":false,"starred":false,"authored":false,"confirmed":"true","hidden":false,"citation_key":"Zesch2007","private_publication":false,"abstract":"We analyze Wikipedia as a lexical semantic resource and compare it with conventional resources, such as dictionaries, thesauri, semantic wordnets, etc. Different parts of Wikipedia reflect different aspects of these resources. We show that Wikipedia contains a vast amount of knowledge about, e.g., named entities, domain specific terms, and rare word senses. If Wikipedia is to be used as a lexical semantic resource in large-scale NLP tasks, efficient programmatic access to the knowledge therein is required. We review existing access mechanisms and show that they are limited with respect to performance and the provided access functions. Therefore, we introduce a general purpose, high performance Java-based Wikipedia API that overcomes these limitations. 
It is available for research purposes at http://www.ukp.tu-darmstadt.de/software/WikipediaAPI.","bibtype":"article","author":"Zesch, Torsten and Gurevych, Iryna and Mühlhäuser, Max","journal":"Data Structures for Linguistic Resources and Applications","number":"March 2001","bibtex":"@article{\n title = {Analyzing and Accessing Wikipedia as a Lexical Semantic Resource},\n type = {article},\n year = {2007},\n pages = {197-205},\n websites = {http://elara.tk.informatik.tu-darmstadt.de/Publications/2007/gldv07_10p.pdf},\n publisher = {Gunter Narr, Tübingen},\n institution = {Ubiquitous Knowledge Processing Group, Darmstadt University of Technology},\n editors = {[object Object],[object Object],[object Object]},\n id = {601d6f3a-48ef-3a44-ba9f-c889f85b908a},\n created = {2012-02-09T21:39:35.000Z},\n file_attached = {false},\n profile_id = {5284e6aa-156c-3ce5-bc0e-b80cf09f3ef6},\n group_id = {066b42c8-f712-3fc3-abb2-225c158d2704},\n last_modified = {2017-03-14T14:36:19.698Z},\n read = {false},\n starred = {false},\n authored = {false},\n confirmed = {true},\n hidden = {false},\n citation_key = {Zesch2007},\n private_publication = {false},\n abstract = {We analyze Wikipedia as a lexical semantic resource and compare it with conventional resources, such as dictionaries, thesauri, semantic wordnets, etc. Different parts of Wikipedia reflect different aspects of these resources. We show that Wikipedia contains a vast amount of knowledge about, e.g., named entities, domain specific terms, and rare word senses. If Wikipedia is to be used as a lexical semantic resource in large-scale NLP tasks, efficient programmatic access to the knowledge therein is required. We review existing access mechanisms and show that they are limited with respect to performance and the provided access functions. Therefore, we introduce a general purpose, high performance Java-based Wikipedia API that overcomes these limitations. 
It is available for research purposes at http://www.ukp.tu-darmstadt.de/software/WikipediaAPI.},\n bibtype = {article},\n author = {Zesch, Torsten and Gurevych, Iryna and Mühlhäuser, Max},\n journal = {Data Structures for Linguistic Resources and Applications},\n number = {March 2001}\n}","author_short":["Zesch, T.","Gurevych, I.","Mühlhäuser, M."],"urls":{"Website":"http://elara.tk.informatik.tu-darmstadt.de/Publications/2007/gldv07_10p.pdf"},"bibbaseid":"zesch-gurevych-mhlhuser-analyzingandaccessingwikipediaasalexicalsemanticresource-2007","role":"author","downloads":0,"html":""},"bibtype":"article","creationDate":"2020-02-06T23:48:11.981Z","downloads":0,"keywords":[],"search_terms":["analyzing","accessing","wikipedia","lexical","semantic","resource","zesch","gurevych","mühlhäuser"],"title":"Analyzing and Accessing Wikipedia as a Lexical Semantic Resource","year":2007}