Seeded discovery of base relations in large corpora. Andrews, N. & Ramakrishnan, N. Proceedings of the Conference on Empirical Methods in Natural Language Processing EMNLP 08, Association for Computational Linguistics, 2008.
Seeded discovery of base relations in large corpora [link]Website  abstract   bibtex   
Relationship discovery is the task of identifying salient relationships between named entities in text. We propose novel approaches for two sub-tasks of the problem: identifying the entities of interest, and partitioning and describing the relations based on their semantics. In particular, we show that term frequency patterns can be used effectively instead of supervised NER, and that the p-median clustering objective function naturally uncovers relation exemplars appropriate for describing the partitioning. Furthermore, we introduce a novel application of relationship discovery: the unsupervised identification of protein-protein interaction phrases.
@article{
 title = {Seeded discovery of base relations in large corpora},
 type = {article},
 year = {2008},
 identifiers = {[object Object]},
 pages = {591-599},
 websites = {http://portal.acm.org/citation.cfm?doid=1613715.1613788},
 publisher = {Association for Computational Linguistics},
 id = {35620152-463d-3ffc-b7bb-071b6fa45dd5},
 created = {2011-12-28T07:04:55.000Z},
 file_attached = {false},
 profile_id = {5284e6aa-156c-3ce5-bc0e-b80cf09f3ef6},
 group_id = {066b42c8-f712-3fc3-abb2-225c158d2704},
 last_modified = {2017-03-14T14:36:19.698Z},
 tags = {named entities,relation extraction},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {Andrews2008},
 private_publication = {false},
 abstract = {Relationship discovery is the task of identifying salient relationships between named entities in text. We propose novel approaches for two sub-tasks of the problem: identifying the entities of interest, and partitioning and describing the relations based on their semantics. In particular, we show that term frequency patterns can be used effectively instead of supervised NER, and that the p-median clustering objective function naturally uncovers relation exemplars appropriate for describing the partitioning. Furthermore, we introduce a novel application of relationship discovery: the unsupervised identification of protein-protein interaction phrases.},
 bibtype = {article},
 author = {Andrews, Nicholas and Ramakrishnan, Naren},
 journal = {Proceedings of the Conference on Empirical Methods in Natural Language Processing EMNLP 08},
 number = {October}
}

Downloads: 0