Streaming-data algorithms for high-quality clustering. O'Callaghan, L., Mishra, N., Meyerson, A., Guha, S., & Motwani, R. In Proceedings 18th International Conference on Data Engineering, pages 685–694, February 2002. ISSN: 1063-6382. [doi] [abstract] [bibtex] Abstract: Streaming data analysis has recently attracted attention in numerous applications including telephone records, Web documents and click streams. For such analysis, single-pass algorithms that consume a small amount of memory are critical. We describe such a streaming algorithm that effectively clusters large data streams. We also provide empirical evidence of the algorithm's performance on synthetic and real data streams.
% Conference paper from the 18th International Conference on Data Engineering (2002).
% The citation key is kept exactly as exported so existing citations keep resolving.
% The ISSN lives in its own `issn` field rather than in a free-text `note`.
@inproceedings{ocallaghan_streaming-data_2002,
  author    = {O'Callaghan, L. and Mishra, N. and Meyerson, A. and Guha, S. and Motwani, R.},
  title     = {Streaming-data algorithms for high-quality clustering},
  booktitle = {Proceedings 18th {International} {Conference} on {Data} {Engineering}},
  pages     = {685--694},
  month     = feb,
  year      = {2002},
  issn      = {1063-6382},
  doi       = {10.1109/ICDE.2002.994785},
  keywords  = {Algorithm design and analysis, Clustering algorithms, Computer science, Data analysis, Data engineering, Lab-on-a-chip, Laboratories, Partitioning algorithms, Telecommunications, Telephony},
  abstract  = {Streaming data analysis has recently attracted attention in numerous applications including telephone records, Web documents and click streams. For such analysis, single-pass algorithms that consume a small amount of memory are critical. We describe such a streaming algorithm that effectively clusters large data streams. We also provide empirical evidence of the algorithm's performance on synthetic and real data streams.},
}
Downloads: 0
{"_id":"odevEc7TDz6jNPtiX","bibbaseid":"ocallaghan-mishra-meyerson-guha-motwani-streamingdataalgorithmsforhighqualityclustering-2002","author_short":["O'Callaghan, L.","Mishra, N.","Meyerson, A.","Guha, S.","Motwani, R."],"bibdata":{"bibtype":"inproceedings","type":"inproceedings","title":"Streaming-data algorithms for high-quality clustering","doi":"10.1109/ICDE.2002.994785","abstract":"Streaming data analysis has recently attracted attention in numerous applications including telephone records, Web documents and click streams. For such analysis, single-pass algorithms that consume a small amount of memory are critical. We describe such a streaming algorithm that effectively clusters large data streams. We also provide empirical evidence of the algorithm's performance on synthetic and real data streams.","booktitle":"Proceedings 18th International Conference on Data Engineering","author":[{"propositions":[],"lastnames":["O'Callaghan"],"firstnames":["L."],"suffixes":[]},{"propositions":[],"lastnames":["Mishra"],"firstnames":["N."],"suffixes":[]},{"propositions":[],"lastnames":["Meyerson"],"firstnames":["A."],"suffixes":[]},{"propositions":[],"lastnames":["Guha"],"firstnames":["S."],"suffixes":[]},{"propositions":[],"lastnames":["Motwani"],"firstnames":["R."],"suffixes":[]}],"month":"February","year":"2002","note":"ISSN: 1063-6382","keywords":"Algorithm design and analysis, Clustering algorithms, Computer science, Data analysis, Data engineering, Lab-on-a-chip, Laboratories, Partitioning algorithms, Telecommunications, Telephony","pages":"685–694","bibtex":"@inproceedings{ocallaghan_streaming-data_2002,\n\ttitle = {Streaming-data algorithms for high-quality clustering},\n\tdoi = {10.1109/ICDE.2002.994785},\n\tabstract = {Streaming data analysis has recently attracted attention in numerous applications including telephone records, Web documents and click streams. For such analysis, single-pass algorithms that consume a small amount of memory are critical. 
We describe such a streaming algorithm that effectively clusters large data streams. We also provide empirical evidence of the algorithm's performance on synthetic and real data streams.},\n\tbooktitle = {Proceedings 18th {International} {Conference} on {Data} {Engineering}},\n\tauthor = {O'Callaghan, L. and Mishra, N. and Meyerson, A. and Guha, S. and Motwani, R.},\n\tmonth = feb,\n\tyear = {2002},\n\tnote = {ISSN: 1063-6382},\n\tkeywords = {Algorithm design and analysis, Clustering algorithms, Computer science, Data analysis, Data engineering, Lab-on-a-chip, Laboratories, Partitioning algorithms, Telecommunications, Telephony},\n\tpages = {685--694},\n}\n\n\n\n","author_short":["O'Callaghan, L.","Mishra, N.","Meyerson, A.","Guha, S.","Motwani, R."],"key":"ocallaghan_streaming-data_2002","id":"ocallaghan_streaming-data_2002","bibbaseid":"ocallaghan-mishra-meyerson-guha-motwani-streamingdataalgorithmsforhighqualityclustering-2002","role":"author","urls":{},"keyword":["Algorithm design and analysis","Clustering algorithms","Computer science","Data analysis","Data engineering","Lab-on-a-chip","Laboratories","Partitioning algorithms","Telecommunications","Telephony"],"metadata":{"authorlinks":{}},"html":""},"bibtype":"inproceedings","biburl":"https://bibbase.org/zotero/mh_lenguyen","dataSources":["iwKepCrWBps7ojhDx"],"keywords":["algorithm design and analysis","clustering algorithms","computer science","data analysis","data engineering","lab-on-a-chip","laboratories","partitioning algorithms","telecommunications","telephony"],"search_terms":["streaming","data","algorithms","high","quality","clustering","o'callaghan","mishra","meyerson","guha","motwani"],"title":"Streaming-data algorithms for high-quality clustering","year":2002}