Towards Publishing Secure Capsule-Based Analysis. Murdock, J., Jett, J., Cole, T., Ma, Y., Downie, J., & Plale, B. In Proceedings of the ACM/IEEE Joint Conference on Digital Libraries, 2017.
doi  abstract   bibtex   
© 2017 IEEE. Computational engagement with the HathiTrust Digital Library (HTDL) is confounded by the in-copyright status and licensing restrictions on the majority of the content. Because of these limitations, computational analysis on the HTDL must either be carried out in a secure environment or on derivative datasets. The HathiTrust Research Center (HTRC) Data Capsule service provides researchers with a secure environment through which they invoke tools that create, analyze, and export non-consumptive datasets. These derivative datasets, so long as they do not reproduce the full-text of the original work, are a transformative work protected by Fair Use provisions of United States Copyright Law, and can be published for reuse by other researchers, as the HTRC Extracted Features Dataset has been. Secure environments and derivative datasets enable researchers to engage with restricted data from focused studies of a few dozen volumes to large-scale experiments on millions of volumes. This paper describes advances in the Capsule service through a case study of how the HTRC Data Capsule service has advanced our activities on provenance, workflows, worksets, and non-consumptive exports through a topic modeling example. We also discuss the potential applications of this Capsule-based model to other digital libraries wrestling with research access and copyright restrictions.
@comment{JCDL 2017 conference paper. The entry key mirrors the citation_key field below; without a key the entry cannot be parsed or cited.}
@inproceedings{Murdock2017,
 title = {Towards Publishing Secure Capsule-Based Analysis},
 type = {inproceedings},
 year = {2017},
 id = {95ade062-b125-3dca-9cc9-e4a2ccbc381c},
 created = {2019-10-01T17:20:48.932Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2019-10-01T17:23:26.309Z},
 read = {true},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Murdock2017},
 folder_uuids = {73f994b4-a3be-4035-a6dd-3802077ce863,3b35931e-fb6d-48f9-8e01-87ee16ef0331},
 private_publication = {false},
 abstract = {© 2017 IEEE. Computational engagement with the HathiTrust Digital Library (HTDL) is confounded by the in-copyright status and licensing restrictions on the majority of the content. Because of these limitations, computational analysis on the HTDL must either be carried out in a secure environment or on derivative datasets. The HathiTrust Research Center (HTRC) Data Capsule service provides researchers with a secure environment through which they invoke tools that create, analyze, and export non-consumptive datasets. These derivative datasets, so long as they do not reproduce the full-text of the original work, are a transformative work protected by Fair Use provisions of United States Copyright Law, and can be published for reuse by other researchers, as the HTRC Extracted Features Dataset has been. Secure environments and derivative datasets enable researchers to engage with restricted data from focused studies of a few dozen volumes to large-scale experiments on millions of volumes. This paper describes advances in the Capsule service through a case study of how the HTRC Data Capsule service has advanced our activities on provenance, workflows, worksets, and non-consumptive exports through a topic modeling example. We also discuss the potential applications of this Capsule-based model to other digital libraries wrestling with research access and copyright restrictions.},
 bibtype = {inproceedings},
 author = {Murdock, J. and Jett, J. and Cole, T. and Ma, Y. and Downie, J. S. and Plale, B.},
 doi = {10.1109/JCDL.2017.7991585},
 booktitle = {Proceedings of the {ACM/IEEE} Joint Conference on Digital Libraries}
}

Downloads: 0