Evaluating the Jaccard-Tanimoto index on multi-core architectures. Sachdeva, V., Freimuth, D. M., & Mueller, C. Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), 5544 LNCS(PART 1):944-953, 2009. Website doi abstract bibtex The Jaccard/Tanimoto coefficient is an important workload, used in a large variety of problems including drug design fingerprinting, clustering analysis, similarity web searching and image segmentation. This paper evaluates the Jaccard coefficient on three platforms: the Cell Broadband Engine™ processor, Intel® Xeon® dual-core platform and Nvidia® 8800 GTX GPU. In our work, we have developed a novel parallel algorithm specially suited for the Cell/B.E. architecture for all-to-all Jaccard comparisons, that minimizes DMA transfers and reuses data in the local store. We show that our implementation on Cell/B.E. outperforms the implementations on comparable Intel platforms by 6-20X with full accuracy, and from 10-50X in reduced accuracy mode, depending on the size of the data, and by more than 60X compared to Nvidia 8800 GTX. In addition to performance, we also discuss in detail our efforts to optimize our workload on these architectures and explain how avenues for optimization on each architecture are very different and vary from one architecture to another for our workload. Our work shows that the algorithms or kernels employed for the Jaccard coefficient calculation are heavily dependent on the traits of the target hardware. © 2009 Springer Berlin Heidelberg.
% ICCS 2009 conference paper published in the Lecture Notes in Computer Science series, volume 5544, part 1.
% Exported from Mendeley via BibBase: the non-standard fields (id, created, read, starred, ...) are
% reference-manager metadata; unknown fields are ignored by BibTeX styles.
@article{Sachdeva2009944,
  title = {Evaluating the {Jaccard-Tanimoto} Index on Multi-Core Architectures},
  type = {article},
  year = {2009},
  keywords = {Architectural design,Cell Broadband Engine; Clustering analysis; DMA tr,Cell membranes; Parallel algorithms},
  pages = {944--953},
  volume = {5544},
  websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-68849090741&doi=10.1007%2F978-3-642-01970-8_95&partnerID=40&md5=b8387401b0d11a665e2af33dd56557e4},
  city = {Baton Rouge, LA},
  id = {7440f35c-4ee5-3b60-b0ec-cbdea0c09d4a},
  created = {2018-01-09T20:30:37.946Z},
  file_attached = {false},
  profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
  last_modified = {2018-03-12T19:03:19.010Z},
  read = {false},
  starred = {false},
  authored = {true},
  confirmed = {true},
  hidden = {false},
  citation_key = {Sachdeva2009944},
  source_type = {article},
  notes = {cited By 6; Conference of 9th International Conference on Computational Science, ICCS 2009 ; Conference Date: 25 May 2009 Through 27 May 2009; Conference Code:77033},
  folder_uuids = {2aba6c14-9027-4f47-8627-0902e1e2342b},
  private_publication = {false},
  abstract = {The Jaccard/Tanimoto coefficient is an important workload, used in a large variety of problems including drug design fingerprinting, clustering analysis, similarity web searching and image segmentation. This paper evaluates the Jaccard coefficient on three platforms: the Cell Broadband Engine\texttrademark{} processor, Intel\textregistered{} Xeon\textregistered{} dual-core platform and Nvidia\textregistered{} 8800 GTX GPU. In our work, we have developed a novel parallel algorithm specially suited for the Cell/B.E. architecture for all-to-all Jaccard comparisons, that minimizes DMA transfers and reuses data in the local store. We show that our implementation on Cell/B.E. outperforms the implementations on comparable Intel platforms by 6-20X with full accuracy, and from 10-50X in reduced accuracy mode, depending on the size of the data, and by more than 60X compared to Nvidia 8800 GTX. In addition to performance, we also discuss in detail our efforts to optimize our workload on these architectures and explain how avenues for optimization on each architecture are very different and vary from one architecture to another for our workload. Our work shows that the algorithms or kernels employed for the Jaccard coefficient calculation are heavily dependent on the traits of the target hardware. {\copyright} 2009 Springer Berlin Heidelberg.},
  bibtype = {article},
  author = {Sachdeva, V and Freimuth, D M and Mueller, C},
  doi = {10.1007/978-3-642-01970-8_95},
  journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  number = {PART 1}
}
Downloads: 0
{"_id":"yWGb7yKXk593oBbEk","bibbaseid":"sachdeva-freimuth-mueller-evaluatingthejaccardtanimotoindexonmulticorearchitectures-2009","downloads":0,"creationDate":"2018-03-12T19:10:28.087Z","title":"Evaluating the jaccard-tanimoto index on multi-core architectures","author_short":["Sachdeva, V.","Freimuth, D., M.","Mueller, C."],"year":2009,"bibtype":"article","biburl":"https://bibbase.org/service/mendeley/42d295c0-0737-38d6-8b43-508cab6ea85d","bibdata":{"title":"Evaluating the jaccard-tanimoto index on multi-core architectures","type":"article","year":"2009","keywords":"Architectural design,Cell Broadband Engine; Clustering analysis; DMA tr,Cell membranes; Parallel algorithms","pages":"944-953","volume":"5544 LNCS","websites":"https://www.scopus.com/inward/record.uri?eid=2-s2.0-68849090741&doi=10.1007%2F978-3-642-01970-8_95&partnerID=40&md5=b8387401b0d11a665e2af33dd56557e4","city":"Baton Rouge, LA","id":"7440f35c-4ee5-3b60-b0ec-cbdea0c09d4a","created":"2018-01-09T20:30:37.946Z","file_attached":false,"profile_id":"42d295c0-0737-38d6-8b43-508cab6ea85d","last_modified":"2018-03-12T19:03:19.010Z","read":false,"starred":false,"authored":"true","confirmed":"true","hidden":false,"citation_key":"Sachdeva2009944","source_type":"article","notes":"cited By 6; Conference of 9th International Conference on Computational Science, ICCS 2009 ; Conference Date: 25 May 2009 Through 27 May 2009; Conference Code:77033","folder_uuids":"2aba6c14-9027-4f47-8627-0902e1e2342b","private_publication":false,"abstract":"The Jaccard/Tanimoto coefficient is an important workload, used in a large variety of problems including drug design fingerprinting, clustering analysis, similarity web searching and image segmentation. This paper evaluates the Jaccard coefficient on three platforms: the Cell Broadband Engine TMprocessor Intel ®Xeon ®dual-core platform and Nvidia ®8800 GTX GPU. In our work, we have developed a novel parallel algorithm specially suited for the Cell/B.E. 
architecture for all-to-all Jaccard comparisons, that minimizes DMA transfers and reuses data in the local store. We show that our implementation on Cell/B.E. outperforms the implementations on comparable Intel platforms by 6-20X with full accuracy, and from 10-50X in reduced accuracy mode, depending on the size of the data, and by more than 60X compared to Nvidia 8800 GTX. In addition to performance, we also discuss in detail our efforts to optimize our workload on these architectures and explain how avenues for optimization on each architecture are very different and vary from one architecture to another for our workload. Our work shows that the algorithms or kernels employed for the Jaccard coefficient calculation are heavily dependent on the traits of the target hardware. © 2009 Springer Berlin Heidelberg.","bibtype":"article","author":"Sachdeva, V and Freimuth, D M and Mueller, C","doi":"10.1007/978-3-642-01970-8_95","journal":"Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)","number":"PART 1","bibtex":"@article{\n title = {Evaluating the jaccard-tanimoto index on multi-core architectures},\n type = {article},\n year = {2009},\n keywords = {Architectural design,Cell Broadband Engine; Clustering analysis; DMA tr,Cell membranes; Parallel algorithms},\n pages = {944-953},\n volume = {5544 LNCS},\n websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-68849090741&doi=10.1007%2F978-3-642-01970-8_95&partnerID=40&md5=b8387401b0d11a665e2af33dd56557e4},\n city = {Baton Rouge, LA},\n id = {7440f35c-4ee5-3b60-b0ec-cbdea0c09d4a},\n created = {2018-01-09T20:30:37.946Z},\n file_attached = {false},\n profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},\n last_modified = {2018-03-12T19:03:19.010Z},\n read = {false},\n starred = {false},\n authored = {true},\n confirmed = {true},\n hidden = {false},\n citation_key = {Sachdeva2009944},\n source_type = {article},\n notes = {cited By 6; 
Conference of 9th International Conference on Computational Science, ICCS 2009 ; Conference Date: 25 May 2009 Through 27 May 2009; Conference Code:77033},\n folder_uuids = {2aba6c14-9027-4f47-8627-0902e1e2342b},\n private_publication = {false},\n abstract = {The Jaccard/Tanimoto coefficient is an important workload, used in a large variety of problems including drug design fingerprinting, clustering analysis, similarity web searching and image segmentation. This paper evaluates the Jaccard coefficient on three platforms: the Cell Broadband Engine TMprocessor Intel ®Xeon ®dual-core platform and Nvidia ®8800 GTX GPU. In our work, we have developed a novel parallel algorithm specially suited for the Cell/B.E. architecture for all-to-all Jaccard comparisons, that minimizes DMA transfers and reuses data in the local store. We show that our implementation on Cell/B.E. outperforms the implementations on comparable Intel platforms by 6-20X with full accuracy, and from 10-50X in reduced accuracy mode, depending on the size of the data, and by more than 60X compared to Nvidia 8800 GTX. In addition to performance, we also discuss in detail our efforts to optimize our workload on these architectures and explain how avenues for optimization on each architecture are very different and vary from one architecture to another for our workload. Our work shows that the algorithms or kernels employed for the Jaccard coefficient calculation are heavily dependent on the traits of the target hardware. 
© 2009 Springer Berlin Heidelberg.},\n bibtype = {article},\n author = {Sachdeva, V and Freimuth, D M and Mueller, C},\n doi = {10.1007/978-3-642-01970-8_95},\n journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},\n number = {PART 1}\n}","author_short":["Sachdeva, V.","Freimuth, D., M.","Mueller, C."],"urls":{"Website":"https://www.scopus.com/inward/record.uri?eid=2-s2.0-68849090741&doi=10.1007%2F978-3-642-01970-8_95&partnerID=40&md5=b8387401b0d11a665e2af33dd56557e4"},"biburl":"https://bibbase.org/service/mendeley/42d295c0-0737-38d6-8b43-508cab6ea85d","bibbaseid":"sachdeva-freimuth-mueller-evaluatingthejaccardtanimotoindexonmulticorearchitectures-2009","role":"author","keyword":["Architectural design","Cell Broadband Engine; Clustering analysis; DMA tr","Cell membranes; Parallel algorithms"],"metadata":{"authorlinks":{}},"downloads":0},"search_terms":["evaluating","jaccard","tanimoto","index","multi","core","architectures","sachdeva","freimuth","mueller"],"keywords":["architectural design","cell broadband engine; clustering analysis; dma tr","cell membranes; parallel algorithms"],"authorIDs":[],"dataSources":["zgahneP4uAjKbudrQ","ya2CyA73rpZseyrZ8","2252seNhipfTmjEBQ"]}