Message progression in parallel computing - To thread or not to thread?. Hoefler, T. & Lumsdaine, A. In Proceedings - IEEE International Conference on Cluster Computing, ICCC, volume Proceeding, pages 213-222, 2008. Institute of Electrical and Electronics Engineers Inc..
Message progression in parallel computing - To thread or not to thread? [link]Website  doi  abstract   bibtex   
Message progression schemes that enable communication and computation to be overlapped have the potential to improve the performance of parallel applications. With currently available high-performance networks there are several options for making progress: manual progression, use of a progress thread, and communication offload. In this paper we analyze threaded progression approaches, comparing the effects of using shared or dedicated CPU cores for progression. To perform these comparisons, we propose time-based and work-based benchmark schemes. As expected, threaded progression performs well when a spare core is available to be dedicated to communication progression, but a number of operating system effects prevent the same benefits from being obtained when communication progress must share a core with computation. We show that some limited performance improvement can be obtained in the shared-core case by real-time scheduling of the progress thread. © 2008 IEEE.
@inproceedings{
 title = {Message progression in parallel computing - To thread or not to thread?},
 type = {inproceedings},
 year = {2008},
 keywords = {Benchmarking; Parallel processing systems,CPU cores; Operating systems; Parallel applicatio,Communication},
 pages = {213-222},
 volume = {Proceeding},
 websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-57949089840&doi=10.1109%2FCLUSTR.2008.4663774&partnerID=40&md5=df816fa322eb7635872ca82b8132d57c},
 publisher = {Institute of Electrical and Electronics Engineers Inc.},
 city = {Tsukuba},
 id = {e7cb2773-8179-3360-94db-67f852463717},
 created = {2018-01-09T20:30:40.129Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2018-03-12T19:03:17.842Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Hoefler2008213},
 source_type = {conference},
 notes = {cited By 43; Conference of 2008 IEEE International Conference on Cluster Computing, ICCC 2008 ; Conference Date: 29 September 2008 Through 1 October 2008; Conference Code:74625},
 folder_uuids = {2aba6c14-9027-4f47-8627-0902e1e2342b},
 private_publication = {false},
 abstract = {Message progression schemes that enable communication and computation to be overlapped have the potential to improve the performance of parallel applications. With currently available high-performance networks there are several options for making progress: manual progression, use of a progress thread, and communication offload. In this paper we analyze threaded progression approaches, comparing the effects of using shared or dedicated CPU cores for progression. To perform these comparisons, we propose time-based and work-based benchmark schemes. As expected, threaded progression performs well when a spare core is available to be dedicated to communication progression, but a number of operating system effects prevent the same benefits from being obtained when communication progress must share a core with computation. We show that some limited performance improvement can be obtained in the shared-core case by real-time scheduling of the progress thread. © 2008 IEEE.},
 bibtype = {inproceedings},
 author = {Hoefler, T and Lumsdaine, A},
 doi = {10.1109/CLUSTR.2008.4663774},
 booktitle = {Proceedings - IEEE International Conference on Cluster Computing, ICCC}
}

Downloads: 0