Mining classifications from social-ecological databases. Jensen, S., Chen, M., Liu, X., Plale, B., & Leake, D. Proceedings of the ASIST Annual Meeting, 2012.
doi  abstract   bibtex   
Social-ecological research is characteristic of long-tail science, with many region-specific studies of social and ecological phenomena that collectively yield a large volume of highly heterogeneous, small data sets. This variability makes it difficult to determine the applicability of a particular data set for a new research question, hindering the reuse of data that has been often collected through extensive effort. In this paper we present results of automatic classification of socio-ecological data into categories defined by a domain model called the SES Framework. We have applied our methods to the classification of a relational database containing over 18 years of research on forest systems. Our preliminary results suggest that decision tree-based classifiers along with textual features perform well at this task. Furthermore, social-ecological data sets are found to exhibit distinct classification features in that the results are promising even for classes that comprise a relatively small portion of the database.
@article{
 title = {Mining classifications from social-ecological databases},
 type = {article},
 year = {2012},
 volume = {49},
 id = {bb999551-9051-3fb9-9425-20180d23be0b},
 created = {2019-10-01T17:20:59.054Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2019-10-01T17:23:57.181Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Jensen2012},
 folder_uuids = {73f994b4-a3be-4035-a6dd-3802077ce863},
 private_publication = {false},
 abstract = {Social-ecological research is characteristic of long-tail science, with many region-specific studies of social and ecological phenomena that collectively yield a large volume of highly heterogeneous, small data sets. This variability makes it difficult to determine the applicability of a particular data set for a new research question, hindering the reuse of data that has been often collected through extensive effort. In this paper we present results of automatic classification of socio-ecological data into categories defined by a domain model called the SES Framework. We have applied our methods to the classification of a relational database containing over 18 years of research on forest systems. Our preliminary results suggest that decision tree-based classifiers along with textual features perform well at this task. Furthermore, social-ecological data sets are found to exhibit distinct classification features in that the results are promising even for classes that comprise a relatively small portion of the database.},
 bibtype = {article},
 author = {Jensen, S. and Chen, M. and Liu, X. and Plale, B. and Leake, D.},
 doi = {10.1002/meet.14504901301},
 journal = {Proceedings of the ASIST Annual Meeting},
 number = {1}
}

Downloads: 0