The effect of network noise on large-scale collective communications. Hoefler, T., Schneider, T., & Lumsdaine, A. Parallel Processing Letters, 19(4):573-593, 2009.
The effect of network noise on large-scale collective communications [link]Website  doi  abstract   bibtex   
The effect of operating system (OS) noise on the performance of large-scale applications is a growing concern and ameliorating the influence of OS noise is a subject of active research. A related problem is that of network noise that arises from the shared use of the interconnection network by parallel processes of different allocations or other background activities. To characterize the effect of network noise on parallel applications, we conducted a series of experiments with a specially crafted benchmark and simulations. Experimental results show a decrease in the communication performance of a parallel reduction operation by a factor of 2 on 246 nodes on an InfiniBand fat-tree and by several orders of magnitude on a BlueGene/P torus. Simulations show how influence of network noise grows with the system size. Although network noise is not as well-studied as OS noise, our results clearly show that it is an important factor that must be considered when running and analyzing large-scale applications. © 2009 World Scientific Publishing Company.
@comment{Journal article record. The citation key is taken from the entry's own citation_key field. Fields after doi (keywords, abstract, websites, id, created, ...) are reference-manager bookkeeping; unknown fields are ignored by standard BibTeX styles.}
@article{Hoefler2009573,
 author = {Hoefler, T and Schneider, T and Lumsdaine, A},
 title = {The effect of network noise on large-scale collective communications},
 journal = {Parallel Processing Letters},
 year = {2009},
 volume = {19},
 number = {4},
 pages = {573--593},
 doi = {10.1142/S0129626409000420},
 keywords = {Benchmarking; Communication; Computer operating s,Collective communications; Communication performan,Computer simulation},
 abstract = {The effect of operating system (OS) noise on the performance of large-scale applications is a growing concern and ameliorating the influence of OS noise is a subject of active research. A related problem is that of network noise that arises from the shared use of the interconnection network by parallel processes of different allocations or other background activities. To characterize the effect of network noise on parallel applications, we conducted a series of experiments with a specially crafted benchmark and simulations. Experimental results show a decrease in the communication performance of a parallel reduction operation by a factor of 2 on 246 nodes on an InfiniBand fat-tree and by several orders of magnitude on a BlueGene/P torus. Simulations show how influence of network noise grows with the system size. Although network noise is not as well-studied as OS noise, our results clearly show that it is an important factor that must be considered when running and analyzing large-scale applications. © 2009 World Scientific Publishing Company.},
 notes = {cited By 3},
 websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-73849109430&doi=10.1142%2FS0129626409000420&partnerID=40&md5=70e40b3a9f7f80d1e7551d0c403291bb},
 type = {article},
 bibtype = {article},
 source_type = {article},
 citation_key = {Hoefler2009573},
 id = {65c77db5-bddc-315c-a47e-ec12af40351e},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 folder_uuids = {2aba6c14-9027-4f47-8627-0902e1e2342b},
 created = {2018-01-09T20:30:38.267Z},
 last_modified = {2018-03-12T19:03:18.645Z},
 file_attached = {false},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 private_publication = {false},
}

Downloads: 0