% Conference paper by Pradhan and Vaidya in the digest of the 24th International
% Symposium on Fault-Tolerant Computing (1994), pages 186--195.
% No series field: the proceedings title is carried by booktitle alone.
@inproceedings{8b577fd568a544bf815fff7e32bb5983,
  author    = {Pradhan, Dhiraj K. and Vaidya, Nitin H.},
  title     = {Roll-forward and rollback recovery: Performance-reliability trade-off},
  booktitle = {Digest of Papers - International Symposium on Fault-Tolerant Computing},
  year      = {1994},
  pages     = {186--195},
  publisher = {IEEE},
  isbn      = {0818655224},
  language  = {English (US)},
  note      = {Proceedings of the 24th International Symposium on Fault-Tolerant Computing ; Conference date: 15-06-1994 Through 17-06-1994},
  abstract  = {Performance and reliability achieved by a modular redundant system depend on the recovery scheme used. Typically, gain in performance using comparable resources results in reduced reliability. Several high-performance computers are noted for small mean time to failure. Performance is measured here in terms of mean and variance of the task completion time, reliability being a task-based measure defined as the probability that a task is completed correctly. Two roll-forward schemes are compared with two rollback schemes for achieving recovery in duplex systems. The roll-forward schemes discussed here are based on a roll-forward checkpointing concept proposed in [5-8]. Roll-forward recovery schemes achieve significantly better performance than rollback schemes by avoiding rollback in most common fault scenarios. It is shown that the roll-forward schemes improve performance with only a small loss in reliability as compared to rollback schemes.},
}