The event notification and alarm system for the Open Science Grid operations center. Hayashi, S., Teige, S., & Quick, R. Journal of Physics: Conference Series, 2012.
The event notification and alarm system for the Open Science Grid operations center [link]Website  abstract   bibtex   
The Open Science Grid Operations (OSG) Team operates a distributed set of services and tools that enable the utilization of the OSG by several HEP projects. Without these services users of the OSG would not be able to run jobs, locate resources, obtain information about the status of systems or generally use the OSG. For this reason these services must be highly available. This paper describes the automated monitoring and notification systems used to diagnose and report problems. Described here are the means used by OSG Operations to monitor systems such as physical facilities, network operations, server health, service availability and software error events. Once detected, an error condition generates a message sent to, for example, Email, SMS, Twitter, an Instant Message Server, etc. The mechanism being developed to integrate these monitoring systems into a prioritized and configurable alarming system is emphasized. © Published under licence by IOP Publishing Ltd.
@article{Hayashi2012,
 author = {Hayashi, S and Teige, S and Quick, R},
 title = {The event notification and alarm system for the {Open Science Grid} operations center},
 journal = {Journal of Physics: Conference Series},
 year = {2012},
 volume = {396},
 number = {3},
 pages = {032105},
 doi = {10.1088/1742-6596/396/3/032105},
 url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84873302521&doi=10.1088%2F1742-6596%2F396%2F3%2F032105&partnerID=40&md5=7b5d9c45549428cd1c7c4fc8e5cdb164},
 type = {article},
 keywords = {Alarm systems,Automated monitoring; Error condition; Event notif,Nuclear physics},
 city = {New York, NY},
 id = {51f38d1f-0fd3-3ab8-bc93-57f45ffbabb7},
 created = {2018-02-27T18:07:25.542Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 group_id = {27e0553c-8ec0-31bd-b42c-825b8a5a9ae8},
 last_modified = {2018-02-27T18:07:25.542Z},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {Hayashi2012},
 source_type = {article},
 notes = {cited By 1; Conference of International Conference on Computing in High Energy and Nuclear Physics 2012, CHEP 2012 ; Conference Date: 21 May 2012 Through 25 May 2012; Conference Code:95155},
 private_publication = {false},
 abstract = {The Open Science Grid Operations (OSG) Team operates a distributed set of services and tools that enable the utilization of the OSG by several HEP projects. Without these services users of the OSG would not be able to run jobs, locate resources, obtain information about the status of systems or generally use the OSG. For this reason these services must be highly available. This paper describes the automated monitoring and notification systems used to diagnose and report problems. Described here are the means used by OSG Operations to monitor systems such as physical facilities, network operations, server health, service availability and software error events. Once detected, an error condition generates a message sent to, for example, Email, SMS, Twitter, an Instant Message Server, etc. The mechanism being developed to integrate these monitoring systems into a prioritized and configurable alarming system is emphasized. © Published under licence by IOP Publishing Ltd.},
 bibtype = {article},
}

Downloads: 0