Extraction of Informative Expressions from Domain-specific Documents. Yamamoto, E., Isahara, H., Terada, A., & Abe, Y. In Proceedings of the 6th International Conference on Language Resources and Evaluation (2008), pages 1611-1618, 2008. European Language Resources Association (ELRA).
Extraction of Informative Expressions from Domain-specific Documents [link]Website  abstract   bibtex   
What kinds of lexical resources are helpful for extracting useful information from domain-specific documents? Although domain-specific documents contain much useful knowledge, it is not obvious how to extract such knowledge efficiently from the documents. We need to develop techniques for extracting hidden information from such domain-specific documents. These techniques do not necessarily use state-of-the-art technologies and achieve deep and accurate language understanding, but are based on huge amounts of linguistic resources, such as domain-specific lexical databases. In this paper, we introduce two techniques for extracting informative expressions from documents: the extraction of related words that are not only taxonomically related but also thematically related, and the acquisition of salient terms and phrases. With these techniques we then attempt to automatically and statistically extract domain-specific informative expressions in aviation documents as an example and evaluate the results.
@comment{
  Conference paper record exported from a reference manager.
  The citation key is taken from the record's own citation_key field.
  The exported "identifiers" and "editors" fields contained only
  "[object Object]" placeholders (seven of them for editors) and were
  dropped; restore the editor names from the proceedings front matter
  if they are needed. The remaining non-standard fields (id, created,
  profile_id, ...) are reference-manager metadata that standard styles ignore.
}
@inproceedings{Yamamoto2008,
  author              = {Yamamoto, Eiko and Isahara, Hitoshi and Terada, Akira and Abe, Yasunori},
  title               = {Extraction of Informative Expressions from Domain-specific Documents},
  booktitle           = {Proceedings of the 6th International Conference on Language Resources and Evaluation (2008)},
  year                = {2008},
  pages               = {1611--1618},
  publisher           = {European Language Resources Association (ELRA)},
  url                 = {http://www.lrec-conf.org/proceedings/lrec2008/},
  abstract            = {What kinds of lexical resources are helpful for extracting useful information from domain-specific documents? Although domain-specific documents contain much useful knowledge, it is not obvious how to extract such knowledge efficiently from the documents. We need to develop techniques for extracting hidden information from such domain-specific documents. These techniques do not necessarily use state-of-the-art technologies and achieve deep and accurate language understanding, but are based on huge amounts of linguistic resources, such as domain-specific lexical databases. In this paper, we introduce two techniques for extracting informative expressions from documents: the extraction of related words that are not only taxonomically related but also thematically related, and the acquisition of salient terms and phrases. With these techniques we then attempt to automatically and statistically extract domain-specific informative expressions in aviation documents as an example and evaluate the results.},
  type                = {inProceedings},
  bibtype             = {inProceedings},
  citation_key        = {Yamamoto2008},
  id                  = {dd69028b-e61f-3ed5-b4df-9af778b2c5cb},
  profile_id          = {5284e6aa-156c-3ce5-bc0e-b80cf09f3ef6},
  group_id            = {066b42c8-f712-3fc3-abb2-225c158d2704},
  created             = {2011-12-29T19:53:53.000Z},
  last_modified       = {2017-03-14T14:36:19.698Z},
  file_attached       = {false},
  read                = {false},
  starred             = {false},
  authored            = {false},
  confirmed           = {true},
  hidden              = {false},
  private_publication = {false}
}

Downloads: 0