Parallel and quantitative sequential pattern mining for large-scale interval-based temporal data. Ruan, G., Zhang, H., & Plale, B. In Proceedings - 2014 IEEE International Conference on Big Data, IEEE Big Data 2014, 2015. doi abstract bibtex © 2014 IEEE. Mining frequent subsequences of patterns, or sequential pattern mining, has wide application in customer shopping sequence analysis, web log stream analysis, multi-modal behavioral studies, to name a few. To detect unknown, anomalous, and unexpected patterns from large-scale interval-based temporal data without complete a priori knowledge is challenging. In this paper, we present a framework - PESMiner which allows parallel and quantitative mining of sequential patterns at scale. Whereas most existing sequential mining algorithms can only find sequential orders of temporal events, our work presents a novel interactive temporal data mining algorithm capable of extracting precise temporal properties of sequential patterns. Furthermore, our work provides a unified parallel solution that scales our algorithms to larger temporal data sets by exploiting iterative MapReduce tasks. Comprehensive performance evaluations demonstrate that PESMiner significantly outperforms existing interval-based mining algorithms in terms of both quality (i.e. accuracy, precision, and recall) and scalability.
@inproceedings{
title = {Parallel and quantitative sequential pattern mining for large-scale interval-based temporal data},
type = {inproceedings},
year = {2015},
id = {de801e1d-18aa-3f8a-b4bc-5bda75a5217f},
created = {2019-10-01T17:20:46.860Z},
file_attached = {false},
profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
last_modified = {2019-10-01T17:23:35.232Z},
read = {false},
starred = {false},
authored = {true},
confirmed = {true},
hidden = {false},
citation_key = {Ruan2015},
folder_uuids = {73f994b4-a3be-4035-a6dd-3802077ce863},
private_publication = {false},
abstract = {© 2014 IEEE. Mining frequent subsequences of patterns, or sequential pattern mining, has wide application in customer shopping sequence analysis, web log stream analysis, multi-modal behavioral studies, to name a few. To detect unknown, anomalous, and unexpected patterns from large-scale interval-based temporal data without complete a priori knowledge is challenging. In this paper, we present a framework - PESMiner which allows parallel and quantitative mining of sequential patterns at scale. Whereas most existing sequential mining algorithms can only find sequential orders of temporal events, our work presents a novel interactive temporal data mining algorithm capable of extracting precise temporal properties of sequential patterns. Furthermore, our work provides a unified parallel solution that scales our algorithms to larger temporal data sets by exploiting iterative MapReduce tasks. Comprehensive performance evaluations demonstrate that PESMiner significantly outperforms existing interval-based mining algorithms in terms of both quality (i.e. accuracy, precision, and recall) and scalability.},
bibtype = {inproceedings},
author = {Ruan, G. and Zhang, H. and Plale, B.},
doi = {10.1109/BigData.2014.7004410},
booktitle = {Proceedings - 2014 IEEE International Conference on Big Data, IEEE Big Data 2014}
}