Predictive Reliability and Fault Management in Exascale Systems: State of the Art and Perspectives. Canal, R., Hernández, C., Tornero, R., Cilardo, A., Massari, G., Reghenzani, F., Fornaciari, W., Zapater, M., Atienza, D., Oleksiak, A., Piatek, W., & Abella, J. ACM Comput. Surv., 53(5):95:1–95:32, 2021.
Predictive Reliability and Fault Management in Exascale Systems: State of the Art and Perspectives [link]Paper  doi  bibtex   
% Journal article, volume 53, issue 5, year 2021; record exported from DBLP.
% The citation key is kept exactly as exported (its trailing 20 does not match
% the 2021 year field) so that existing citations keep resolving.
% The journal field stores the full journal title; abbreviating it is left to
% the bibliography style. Author names use the "Last, First" form so that the
% name parser never has to guess where the surname starts.
% timestamp, biburl and bibsource are DBLP bookkeeping fields.
@article{DBLP:journals/csur/CanalHTCMRFZAOP20,
  author    = {Canal, Ramon and
               Hern{\'a}ndez, Carles and
               Tornero, Rafael and
               Cilardo, Alessandro and
               Massari, Giuseppe and
               Reghenzani, Federico and
               Fornaciari, William and
               Zapater, Marina and
               Atienza, David and
               Oleksiak, Ariel and
               Piatek, Wojciech and
               Abella, Jaume},
  title     = {Predictive Reliability and Fault Management in Exascale Systems: State
               of the Art and Perspectives},
  journal   = {{ACM} Computing Surveys},
  volume    = {53},
  number    = {5},
  pages     = {95:1--95:32},
  year      = {2021},
  doi       = {10.1145/3403956},
  url       = {https://doi.org/10.1145/3403956},
  timestamp = {Wed, 23 Nov 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/csur/CanalHTCMRFZAOP20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

Downloads: 0