Scalable Distributed DNN Training using TensorFlow and CUDA-Aware MPI: Characterization, Designs, and Performance Evaluation

Scalable Distributed DNN Training using TensorFlow and CUDA-Aware MPI: Characterization, Designs, and Performance Evaluation. Awan, A. A., Bédorf, J., Chu, C., Subramoni, H., & Panda, D. K. CoRR, 2018.

Paper bibtex

% arXiv preprint 1810.11112 (CoRR); record exported from the DBLP bibliography.
% Title braces protect DNN, TensorFlow, CUDA and MPI from style-applied sentence casing;
% the subtitle colon stays outside the braces so styles can see it.
@article{DBLP:journals/corr/abs-1810-11112,
  author    = {Ammar Ahmad Awan and
               Jeroen B{\'{e}}dorf and
               Ching{-}Hsiang Chu and
               Hari Subramoni and
               Dhabaleswar K. Panda},
  title     = {Scalable Distributed {DNN} Training using {TensorFlow} and {CUDA}-Aware
               {MPI}: Characterization, Designs, and Performance Evaluation},
  journal   = {CoRR},
  volume    = {abs/1810.11112},
  year      = {2018},
  url       = {https://arxiv.org/abs/1810.11112},
  archivePrefix = {arXiv},
  eprint    = {1810.11112},
  timestamp = {Wed, 31 Oct 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/journals/corr/abs-1810-11112},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0

{"_id":"YZAWTf4CadpPgdRPY","bibbaseid":"awan-bdorf-chu-subramoni-panda-scalabledistributeddnntrainingusingtensorflowandcudaawarempicharacterizationdesignsandperformanceevaluation-2018","downloads":0,"creationDate":"2019-03-26T15:13:04.531Z","title":"Scalable Distributed DNN Training using TensorFlow and CUDA-Aware MPI: Characterization, Designs, and Performance Evaluation","author_short":["Awan, A. A.","Bédorf, J.","Chu, C.","Subramoni, H.","Panda, D. K."],"year":2018,"bibtype":"article","biburl":"https://dblp.org/pid/60/9487.bib","bibdata":{"bibtype":"article","type":"article","author":[{"firstnames":["Ammar","Ahmad"],"propositions":[],"lastnames":["Awan"],"suffixes":[]},{"firstnames":["Jeroen"],"propositions":[],"lastnames":["Bédorf"],"suffixes":[]},{"firstnames":["Ching-Hsiang"],"propositions":[],"lastnames":["Chu"],"suffixes":[]},{"firstnames":["Hari"],"propositions":[],"lastnames":["Subramoni"],"suffixes":[]},{"firstnames":["Dhabaleswar","K."],"propositions":[],"lastnames":["Panda"],"suffixes":[]}],"title":"Scalable Distributed DNN Training using TensorFlow and CUDA-Aware MPI: Characterization, Designs, and Performance Evaluation","journal":"CoRR","volume":"abs/1810.11112","year":"2018","url":"http://arxiv.org/abs/1810.11112","archiveprefix":"arXiv","eprint":"1810.11112","timestamp":"Wed, 31 Oct 2018 00:00:00 +0100","biburl":"https://dblp.org/rec/bib/journals/corr/abs-1810-11112","bibsource":"dblp computer science bibliography, https://dblp.org","bibtex":"@article{DBLP:journals/corr/abs-1810-11112,\n author = {Ammar Ahmad Awan and\n Jeroen B{\\'{e}}dorf and\n Ching{-}Hsiang Chu and\n Hari Subramoni and\n Dhabaleswar K. Panda},\n title = {Scalable Distributed {DNN} Training using TensorFlow and CUDA-Aware\n {MPI:} Characterization, Designs, and Performance Evaluation},\n journal = {CoRR},\n volume = {abs/1810.11112},\n year = {2018},\n url = {http://arxiv.org/abs/1810.11112},\n archivePrefix = {arXiv},\n eprint = {1810.11112},\n timestamp = {Wed, 31 Oct 2018 00:00:00 +0100},\n biburl = {https://dblp.org/rec/bib/journals/corr/abs-1810-11112},\n bibsource = {dblp computer science bibliography, https://dblp.org}\n}\n\n","author_short":["Awan, A. A.","Bédorf, J.","Chu, C.","Subramoni, H.","Panda, D. K."],"key":"DBLP:journals/corr/abs-1810-11112","id":"DBLP:journals/corr/abs-1810-11112","bibbaseid":"awan-bdorf-chu-subramoni-panda-scalabledistributeddnntrainingusingtensorflowandcudaawarempicharacterizationdesignsandperformanceevaluation-2018","role":"author","urls":{"Paper":"http://arxiv.org/abs/1810.11112"},"downloads":0},"search_terms":["scalable","distributed","dnn","training","using","tensorflow","cuda","aware","mpi","characterization","designs","performance","evaluation","awan","bédorf","chu","subramoni","panda"],"keywords":[],"authorIDs":[],"dataSources":["ofX3Q3Jrhh9o9JFMa"]}