X-tract: Structure extraction from botanical textual descriptions. Abascal, R. & Sánchez, J., A. String Processing and Information Retrieval Symposium International Workshop on Groupware, Published by the IEEE Computer Society, 1999.
X-tract: Structure extraction from botanical textual descriptions [link]Website  abstract   bibtex   
Most available information today, both from printed books and digital repositories, is in the form of free-format texts. The task of retrieving information from these ever-growing repositories has become a challenge for information retrieval (IR) researchers. In some fields, such as Botany and Taxonomy, textual descriptions observe a set of rules and use a relatively limited vocabulary. This makes botanical textual descriptions an interesting area to explore IR techniques for finding structure and facilitating semantic analysis.This paper presents X-tract, a solution to the problem of text analysis and structure extraction in a specific application domain, namely floristic morphologic descriptions. The solution demonstrates the potential of using a grammar in the determination of information structure in a botanical digital library. We have developed a prototype based on this approach in which given an HTML or plain text, X-tract analyzes it and presents results to the user so he or she can verify the proposed structure before updating the database. This transformation is useful also in the process of storing morphologic descriptions in a database with a pre-established format. The solution is implemented in the context of the Floristic Digital Library (FDL), a large digital library project comprising a wide variety of botanical documents, formats and services.
@article{
 title = {X-tract: Structure extraction from botanical textual descriptions},
 type = {article},
 year = {1999},
 keywords = {botanical,create a digital,digital libraries,fdl,information extraction,library with information about,main objective,plants from various,project,x tract},
 pages = {2-7},
 websites = {http://www.computer.org/portal/web/csdl/doi/10.1109/SPIRE.1999.796571},
 publisher = {Published by the IEEE Computer Society},
 id = {9e338712-af06-333e-a327-cc0bd740bf75},
 created = {2011-12-29T19:53:53.000Z},
 file_attached = {false},
 profile_id = {5284e6aa-156c-3ce5-bc0e-b80cf09f3ef6},
 group_id = {066b42c8-f712-3fc3-abb2-225c158d2704},
 last_modified = {2017-03-14T14:36:19.698Z},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {Abascal1999},
 private_publication = {false},
 abstract = {Most available information today, both from printed books and digital repositories, is in the form of free-format texts. The task of retrieving information from these ever-growing repositories has become a challenge for information retrieval (IR) researchers. In some fields, such as Botany and Taxonomy, textual descriptions observe a set of rules and use a relatively limited vocabulary. This makes botanical textual descriptions an interesting area to explore IR techniques for finding structure and facilitating semantic analysis.This paper presents X-tract, a solution to the problem of text analysis and structure extraction in a specific application domain, namely floristic morphologic descriptions. The solution demonstrates the potential of using a grammar in the determination of information structure in a botanical digital library. We have developed a prototype based on this approach in which given an HTML or plain text, X-tract analyzes it and presents results to the user so he or she can verify the proposed structure before updating the database. This transformation is useful also in the process of storing morphologic descriptions in a database with a pre-established format. The solution is implemented in the context of the Floristic Digital Library (FDL), a large digital library project comprising a wide variety of botanical documents, formats and services.},
 bibtype = {article},
 author = {Abascal, Rocío and Sánchez, J Alfredo},
 journal = {String Processing and Information Retrieval Symposium International Workshop on Groupware}
}

Downloads: 0