A Fast and Generic GPU-Based Parallel Reduction Implementation. Jradi, W. A. R., Nascimento, H., & Martins, W. S. In 2018 Symposium on High Performance Computing Systems (WSCAD), pages 16–22, Oct. 2018.
doi  bibtex   
% Conference paper from WSCAD 2018. The citation key is kept unchanged so that
% existing citations of key 8748915 still resolve.
@InProceedings{8748915,
  author    = {Jradi, W. A. R. and Nascimento, H. and Martins, W. S.},
  title     = {A Fast and Generic {GPU}-Based Parallel Reduction Implementation},
  booktitle = {2018 Symposium on High Performance Computing Systems ({WSCAD})},
  year      = {2018},
  pages     = {16--22},
  month     = oct,
  doi       = {10.1109/WSCAD.2018.00013},
  keywords  = {graphics processing units;multiprocessing systems;parallel architectures;parallel processing;persistent threads;reduction operations;parallel reduction;GPU-based parallel approach;AMD hardware platform;NVidia hardware platform;OpenCL;CUDA;Graphics processing units;Indexes;Synchronization;Hardware;Bandwidth;Proposals;Instruction sets;GPU, Parallel Reduction, Fast, Generic},
}

Downloads: 0