Parallel and quantitative sequential pattern mining for large-scale interval-based temporal data. Ruan, G., Zhang, H., & Plale, B. In Proceedings - 2014 IEEE International Conference on Big Data, IEEE Big Data 2014, 2015.
doi  abstract   bibtex   
© 2014 IEEE. Mining frequent subsequences of patterns, or sequential pattern mining, has wide application in customer shopping sequence analysis, web log stream analysis, multi-modal behavioral studies, to name a few. To detect unknown, anomalous, and unexpected patterns from large-scale interval-based temporal data without complete a priori knowledge is challenging. In this paper, we present a framework - PESMiner which allows parallel and quantitative mining of sequential patterns at scale. Whereas most existing sequential mining algorithms can only find sequential orders of temporal events, our work presents a novel interactive temporal data mining algorithm capable of extracting precise temporal properties of sequential patterns. Furthermore, our work provides a unified parallel solution that scales our algorithms to larger temporal data sets by exploiting iterative MapReduce tasks. Comprehensive performance evaluations demonstrate that PESMiner significantly outperforms existing interval-based mining algorithms in terms of both quality (i.e. accuracy, precision, and recall) and scalability.
@inproceedings{
 title = {Parallel and quantitative sequential pattern mining for large-scale interval-based temporal data},
 type = {inproceedings},
 year = {2015},
 id = {d5f1bad9-17f5-3abf-a766-5148951a9db5},
 created = {2018-03-05T18:20:23.969Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 group_id = {9d761a94-2f2d-31ce-a8c3-50aa6d668643},
 last_modified = {2018-03-05T18:20:23.969Z},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {false},
 hidden = {false},
 citation_key = {Ruan2015},
 private_publication = {false},
 abstract = {© 2014 IEEE. Mining frequent subsequences of patterns, or sequential pattern mining, has wide application in customer shopping sequence analysis, web log stream analysis, multi-modal behavioral studies, to name a few. To detect unknown, anomalous, and unexpected patterns from large-scale interval-based temporal data without complete a priori knowledge is challenging. In this paper, we present a framework - PESMiner which allows parallel and quantitative mining of sequential patterns at scale. Whereas most existing sequential mining algorithms can only find sequential orders of temporal events, our work presents a novel interactive temporal data mining algorithm capable of extracting precise temporal properties of sequential patterns. Furthermore, our work provides a unified parallel solution that scales our algorithms to larger temporal data sets by exploiting iterative MapReduce tasks. Comprehensive performance evaluations demonstrate that PESMiner significantly outperforms existing interval-based mining algorithms in terms of both quality (i.e. accuracy, precision, and recall) and scalability.},
 bibtype = {inproceedings},
 author = {Ruan, G. and Zhang, H. and Plale, B.},
 doi = {10.1109/BigData.2014.7004410},
 booktitle = {Proceedings - 2014 IEEE International Conference on Big Data, IEEE Big Data 2014}
}

Downloads: 0