% Conference paper in the WISE 2021 proceedings (Lecture Notes in Computer Science).
% Cleaned from an automatic export: localized field values translated to English,
% DOI stored unescaped, names in "Last, First" form, proper noun in title protected.
% NOTE(review): "address" holds only the publisher's country as exported; replace
% with the publisher's city once confirmed.
@inproceedings{63e73ae7bc3b4690af3609f24066244c,
  author    = {Yang, Yi and Yang, Zhenhua and Xu, Chen},
  title     = {Exploiting Unblocking Checkpoint for Fault-Tolerance in {Pregel}-Like Systems},
  booktitle = {Web Information Systems Engineering - WISE 2021 - 22nd International Conference on Web Information Systems Engineering, WISE 2021, Proceedings},
  editor    = {Zhang, Wenjie and Zou, Lei and Maamar, Zakaria and Chen, Lu},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  address   = {Germany},
  year      = {2021},
  pages     = {71--86},
  doi       = {10.1007/978-3-030-90888-1_6},
  isbn      = {9783030908874},
  language  = {English},
  keywords  = {Checkpoint, Fault tolerance, Graph processing},
  abstract  = {With the explosive growth of graph size, a series of Pregel-like systems have emerged. Typically, these systems employ checkpointing and rollback mechanisms to achieve fault-tolerance in either blocking or unblocking manner. The blocking checkpointing pauses the iterative processing while checkpointing, whereas the unblocking checkpointing writes the checkpoints in parallel with the iterative processing. The unblocking checkpointing decreases the checkpointing overhead, but incurs resource contention due to checkpointing concurrently. Hence, it may prolong the time on execution and checkpointing. In this work, we propose a queuing strategy to alleviate the contention. This strategy employs a checkpoint queue to store all the pending checkpoints, which allows to concurrently write a certain number of checkpoints at most from the queue following a First-In-First-Out (FIFO) policy. To further utilize the characteristics of checkpoint in Pregel-like systems, we define checkpoint staleness and checkpoint tardiness, and then propose staleness/tardiness-aware skipping policy to replace the FIFO policy. Extensive experiments verified that the queuing strategy with the skipping policy outperforms blocking and unblocking checkpointing in Pregel-like systems.},
  note      = {Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; 22nd International Conference on Web Information Systems Engineering, WISE 2021 ; Conference date: 26-10-2021 Through 29-10-2021},
}