% Conference paper describing libckpt, presented at the USENIX 1995 Technical
% Conference (held 16-20 January 1995).
% The acknowledgement/funding paragraph is stored in the non-standard `funding`
% field: BibTeX styles silently ignore unknown fields, so the text stays in the
% database without being printed in reference lists (as it would be in `note`).
% `eventdate` is only read by biblatex; classic BibTeX uses `year` and `month`.
@inproceedings{1fddad0d9a2e4441b59417a3621fb794,
  author    = {Plank, James S. and Beck, Micah and Kingsley, Gerry and Li, Kai},
  title     = {{Libckpt}: Transparent checkpointing under {Unix}},
  booktitle = {{USENIX} 1995 Technical Conference Proceedings},
  publisher = {USENIX Association},
  year      = {1995},
  month     = jan,
  eventdate = {1995-01-16/1995-01-20},
  language  = {English (US)},
  abstract  = {Checkpointing is a simple technique for rollback recovery: the state of an executing program is periodically saved to a disk file from which it can be recovered after a failure. While recent research has developed a collection of powerful techniques for minimizing the overhead of writing checkpoint files, checkpointing remains unavailable to most application developers. In this paper we describe libckpt, a portable checkpointing tool for Unix that implements all applicable performance optimizations which are reported in the literature. While libckpt can be used in a mode which is almost totally transparent to the programmer, it also supports the incorporation of user directives into the creation of checkpoints. This user-directed checkpointing is an innovation which is unique to our work.},
  funding   = {The authors thank Jian Xu, Jack Dongarra, Christian Halloy, and the National Center for Atmospheric Research for help in obtaining test programs. We also thank Nitin Vaidya, Mootaz Elnozahy, Heather Booth, and the referees for their valuable comments. James Plank is supported by NSF grant CCR-9409496. Kai Li is supported by ARPA and ONR under contracts N00014-91-J-4039, and Intel Supercomputer Systems Division.},
}