% Buga and Nemes, conference paper in DEXA 2017, Part I (LNCS vol. 10438), pp. 505--513.
% NOTE(review): the exported record listed the publisher ("Springer") in the
% editor field; that bogus value was dropped. Add the real volume editors from
% the publisher's record if an editor list is needed.
% The DOI is stored bare (no LaTeX escaping of the underscore); DOI-aware
% styles and the url/hyperref machinery handle the character themselves.
@inproceedings{3cb8a7a9741848d396cd99f9b56d159f,
  author    = {Buga, Andreea and Nemes, Sorana-Tania},
  title     = {A Formal Approach for Failure Detection in Large-Scale Distributed Systems Using {Abstract State Machines}},
  booktitle = {Database and Expert Systems Applications -- 28th International Conference, {DEXA} 2017, Lyon, France, August 28--31, 2017, Proceedings, Part I},
  series    = {Lecture Notes in Computer Science},
  volume    = {10438},
  pages     = {505--513},
  publisher = {Springer},
  year      = {2017},
  isbn      = {978-3-319-64467-7},
  doi       = {10.1007/978-3-319-64468-4_38},
  language  = {English},
  abstract  = {Large-scale distributed systems have been widely adopted in various domains due to their ability to compose services and resources tailored to user requirements. Such systems are characterized by high complexity and heterogeneity. Maintaining a high-level availability and a normal execution of the components implies precise monitoring and robust adaptation. Monitors capture relevant metrics and transform them to meaningful knowledge, which is further used in justifying adaptation actions. The current paper proposes an Abstract State Machine model for defining monitoring processes addressing failures and unavailability of the system nodes. The specification is simulated and validated with the aid of the ASMETA toolset. The solution is complemented with a small ontology reflecting the structure of the system. We emphasize the role of formal models in achieving the proposed requirements.},
}