Replication-based fault tolerance for MPI applications. Walters, J. P. & Chaudhary, V. IEEE Transactions on Parallel and Distributed Systems, 20(7):997–1010, IEEE, 2008.
bibtex   
@comment{Journal article by Walters and Chaudhary on replication-based fault tolerance for MPI applications.
NOTE(review): volume 20 of this journal may correspond to 2009, with 2008 being the online-first date -- confirm against the publisher record before changing the year field.}
@article{walters2008replication,
  author    = {Walters, John Paul and Chaudhary, Vipin},
  title     = {Replication-Based Fault Tolerance for {MPI} Applications},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  volume    = {20},
  number    = {7},
  pages     = {997--1010},
  year      = {2008},
  publisher = {IEEE},
}

Downloads: 0