Co-processing SPMD computation on CPUs and GPUs cluster. Li, H., Fox, G. C., Von Laszewski, G., & Chauhan, A. In Proceedings - IEEE International Conference on Cluster Computing, ICCC, 2013.
doi  abstract   bibtex   
Heterogeneous parallel systems with multi processors and accelerators are becoming ubiquitous due to better cost-performance and energy-efficiency. These heterogeneous processor architectures have different instruction sets and are optimized for either task-latency or throughput purposes. Challenges occur in regard to programmability and performance when running SPMD tasks on heterogeneous devices. In order to meet these challenges, we implemented a parallel runtime system that used to co-process SPMD computation on CPUs and GPUs clusters. Furthermore, we are proposing an analytic model to automatically schedule SPMD tasks on heterogeneous clusters. Our analytic model is derived from the roofline model, and therefore it can be applied to a wider range of SPMD applications and hardware devices. The experimental results of the C-means, GMM, and GEMV show good speedup in practical heterogeneous cluster environments. © 2013 IEEE.
@comment{Conference paper on co-processing SPMD tasks on CPU/GPU clusters. The citation key is taken from the exported citation_key field; fields such as id, profile_id and folder_uuids are reference-manager metadata that bibliography styles ignore.}
@inproceedings{Li2013,
 title = {Co-processing {SPMD} computation on {CPUs} and {GPUs} cluster},
 type = {inproceedings},
 year = {2013},
 id = {80459917-9e7b-395d-b194-edf6ba8ed10a},
 created = {2019-10-01T17:20:57.374Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2019-10-01T17:24:45.895Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Li2013},
 folder_uuids = {82975498-107c-4bb3-bb76-f87bce3e9f6e},
 private_publication = {false},
 abstract = {Heterogeneous parallel systems with multi processors and accelerators are becoming ubiquitous due to better cost-performance and energy-efficiency. These heterogeneous processor architectures have different instruction sets and are optimized for either task-latency or throughput purposes. Challenges occur in regard to programmability and performance when running SPMD tasks on heterogeneous devices. In order to meet these challenges, we implemented a parallel runtime system that used to co-process SPMD computation on CPUs and GPUs clusters. Furthermore, we are proposing an analytic model to automatically schedule SPMD tasks on heterogeneous clusters. Our analytic model is derived from the roofline model, and therefore it can be applied to a wider range of SPMD applications and hardware devices. The experimental results of the C-means, GMM, and GEMV show good speedup in practical heterogeneous cluster environments. © 2013 IEEE.},
 bibtype = {inproceedings},
 author = {Li, H. and Fox, Geoffrey Charles and von Laszewski, G. and Chauhan, A.},
 doi = {10.1109/CLUSTER.2013.6702632},
 booktitle = {Proceedings - IEEE International Conference on Cluster Computing, ICCC}
}

Downloads: 0