The Distant Reader. Morgan, E. L., Abeysinghe, E., Pamidighantam, S., Coulter, E., Marru, S., & Pierce, M. In Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning) - PEARC '19, pages 1-4, 2019. ACM Press.
The Distant Reader [link]Website  doi  abstract   bibtex   
The Distant Reader science gateway can be used to automatically create and analyze text corpora at a scale of thousands of user-supplied documents. These processing steps are deployed on a dynamic virtual cluster deployed on XSEDE's Jetstream academic cloud computing resource and are accessed through a Web interface. The science gateway uses Apache Airavata middleware to manage the interactions between the Web interface and the virtual clusters. The gateway leverages the Science Gateway Platform as a service (SciGaP) infrastructure at Indiana University, which provides user authentication, authorization, and identity management as well as access to the Distant Reader tools. The Distant Reader is designed to assist in the process of using & understanding corpora -- reading.
@comment{Conference paper entry. The key matches the citation_key field. Fields such as id, created, profile_id, read, starred and hidden are reference-manager bookkeeping that standard styles ignore.}
@inproceedings{Morgan2019,
 title = {The {Distant} {Reader}},
 type = {inproceedings},
 year = {2019},
 pages = {1--4},
 websites = {http://dl.acm.org/citation.cfm?doid=3332186.3333260},
 publisher = {ACM Press},
 city = {New York, New York, USA},
 id = {1d3ad6d9-9f9a-31f3-ba1e-0169bab01e7f},
 created = {2019-10-01T17:20:20.775Z},
 accessed = {2019-08-19},
 file_attached = {true},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2020-05-11T14:43:44.043Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Morgan2019},
 private_publication = {false},
 abstract = {The Distant Reader science gateway can be used to automatically create and analyze text corpora at a scale of thousands of user-supplied documents. These processing steps are deployed on a dynamic virtual cluster deployed on XSEDE's Jetstream academic cloud computing resource and are accessed through a Web interface. The science gateway uses Apache Airavata middleware to manage the interactions between the Web interface and the virtual clusters. The gateway leverages the Science Gateway Platform as a service (SciGaP) infrastructure at Indiana University, which provides user authentication, authorization, and identity management as well as access to the Distant Reader tools. The Distant Reader is designed to assist in the process of using \& understanding corpora -- reading.},
 bibtype = {inproceedings},
 author = {Morgan, Eric Lease and Abeysinghe, Eroma and Pamidighantam, Sudhakar and Coulter, Eric and Marru, Suresh and Pierce, Marlon},
 doi = {10.1145/3332186.3333260},
 booktitle = {Proceedings of the Practice and Experience in Advanced Research Computing on Rise of the Machines (learning) - {PEARC} '19}
}

Downloads: 0