% Conference paper from DSN 2006 (see the booktitle and note fields).
% Maintenance notes:
%  - {Markov} in the title and {DSN} in the booktitle are brace-protected so
%    that styles which sentence-case these fields keep the capitals.
%  - Authors use the plain "Last, First Middle" form; given names are not
%    wrapped in braces, so each name part is a separate token that a style
%    can abbreviate individually.
%  - The citation key is left unchanged so existing \cite commands still resolve.
@inproceedings{580acb832e174c46983f1ffd561d1202,
title = "Automatic recovery using bounded partially observable {Markov} decision processes",
abstract = "This paper provides a technique, based on partially observable Markov decision processes (POMDPs), for building automatic recovery controllers to guide distributed system recovery in a way that provides provable assurances on the quality of the generated recovery actions even when the diagnostic information may be imprecise. Lower bounds on the cost of recovery are introduced and proved, and it is shown how the characteristics of the recovery process can be used to ensure that the lower bounds converge even on undiscounted models. The bounds used in an appropriate online controller provide it with provable termination properties. Simulation-based experimental results on a realistic e-commerce system demonstrate that the proposed bounds can be improved iteratively, and the resulting controller convincingly outperforms a controller that uses heuristics instead of bounds.",
author = "Joshi, Kaustubh R. and Hiltunen, Matti A. and Sanders, William H. and Schlichting, Richard D.",
year = "2006",
doi = "10.1109/DSN.2006.16",
language = "English (US)",
isbn = "0769526071",
series = "Proceedings of the International Conference on Dependable Systems and Networks",
pages = "445--454",
booktitle = "Proceedings - {DSN} 2006",
note = "DSN 2006: 2006 International Conference on Dependable Systems and Networks ; Conference date: 25-06-2006 Through 28-06-2006",
}