Optimized routing for large-scale InfiniBand networks. Hoefler, T., Schneider, T., & Lumsdaine, A. In Proceedings - Symposium on the High Performance Interconnects, Hot Interconnects, pages 103-111, 2009.
Optimized routing for large-scale InfiniBand networks [link]Website  doi  abstract   bibtex   
Point-to-point metrics, such as latency and bandwidth, are often used to characterize network performance with the consequent assumption that optimizing for these metrics is sufficient to improve parallel application performance. However, these metrics can only provide limited insight into application behavior because they do not fully account for effects, such as network congestion, that significantly influence overall network performance. Because many high-performance networks use deterministic oblivious routing, one such effect is the choice of routing algorithm. In this paper, we analyze and compare practical and theoretical aspects of different routing algorithms that are used in today's large-scale networks. We show that widely-used theoretical metrics, such as edge-forwarding index or bisection bandwidth, are not accurate predictors for average network bandwidth. Instead, we introduce an intuitive metric, which we call "effective bisection bandwidth" to characterize quality of different routing algorithms. We present a simple algorithm that globally balances routes and therefore improves the effective bandwidth of the network. Compared to the best algorithm in use today, our new algorithm shows an improvement in effective bisection bandwidth of 40% on a 724-endpoint InfiniBand cluster. © 2009 IEEE.
@inproceedings{
 title = {Optimized routing for large-scale InfiniBand networks},
 type = {inproceedings},
 year = {2009},
 keywords = {Bandwidth; Network performance; Queueing networks,Bisection bandwidth; Effective bandwidth; Forwardi,Clustering algorithms},
 pages = {103-111},
 websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-77950933459&doi=10.1109%2FHOTI.2009.9&partnerID=40&md5=4c8196273b263f9b44dfeed3a659a6b8},
 city = {New York, NY},
 id = {9f4e52bc-feb5-313d-b34f-f18c238f4b00},
 created = {2018-01-09T20:30:39.052Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2018-03-12T19:03:18.209Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Hoefler2009103},
 source_type = {conference},
 notes = {cited By 17; Conference of 17th IEEE Symposium on High Performance Interconnects, HOTI 2009 ; Conference Date: 25 August 2009 Through 27 August 2009; Conference Code:79862},
 folder_uuids = {2aba6c14-9027-4f47-8627-0902e1e2342b},
 private_publication = {false},
 abstract = {Point-to-point metrics, such as latency and bandwidth, are often used to characterize network performance with the consequent assumption that optimizing for these metrics is sufficient to improve parallel application performance. However, these metrics can only provide limited insight into application behavior because they do not fully account for effects, such as network congestion, that significantly influence overall network performance. Because many high-performance networks use deterministic oblivious routing, one such effect is the choice of routing algorithm. In this paper, we analyze and compare practical and theoretical aspects of different routing algorithms that are used in today's large-scale networks. We show that widely-used theoretical metrics, such as edge-forwarding index or bisection bandwidth, are not accurate predictors for average network bandwidth. Instead, we introduce an intuitive metric, which we call "effective bisection bandwidth" to characterize quality of different routing algorithms. We present a simple algorithm that globally balances routes and therefore improves the effective bandwidth of the network. Compared to the best algorithm in use today, our new algorithm shows an improvement in effective bisection bandwidth of 40% on a 724-endpoint InfiniBand cluster. © 2009 IEEE.},
 bibtype = {inproceedings},
 author = {Hoefler, T and Schneider, T and Lumsdaine, A},
 doi = {10.1109/HOTI.2009.9},
 booktitle = {Proceedings - Symposium on the High Performance Interconnects, Hot Interconnects}
}

Downloads: 0