% Conference paper (ICDE 2024) presenting AETS, an adaptive epoch-based
% two-stage log replay framework for HTAP systems.
% NOTE(review): `address` carries the country supplied by the export (translated
% from Chinese); presumably the publisher's location -- confirm, or replace it
% with the publisher's city.
@inproceedings{d6b07668885d487fb23e78a1c4fd5b67,
  author    = {Zhu, Jun Peng and Ye, Zhiwei and Cai, Peng and Wang, Donghui and Zhang, Fengyan and Cai, Dunbo and Qian, Ling},
  title     = {Log Replaying for Real-Time {HTAP}: An Adaptive Epoch-Based Two-Stage Framework},
  booktitle = {Proceedings - 2024 IEEE 40th International Conference on Data Engineering, ICDE 2024},
  series    = {Proceedings - International Conference on Data Engineering},
  pages     = {2096--2108},
  publisher = {IEEE Computer Society},
  address   = {United States},
  year      = {2024},
  doi       = {10.1109/ICDE60146.2024.00167},
  language  = {English},
  keywords  = {HTAP, parallel log replay, replication},
  note      = {Publisher Copyright: {\textcopyright} 2024 IEEE.; 40th IEEE International Conference on Data Engineering, ICDE 2024 ; Conference date: 13-05-2024 Through 17-05-2024},
  abstract  = {As real-time analytics become increasingly important, more organizations are deploying Hybrid Transactional/Analytical Processing (HTAP) systems. The HTAP systems, based on a primary/backup replication architecture, usually support real-time read-only queries on backup nodes for the data recently generated by OLTP applications on the primary node. This work is based on the observation that real-time analytical applications often require access to only a fraction of the latest modifications from OLTP applications. However, the state-of-the-art parallel log replay approaches treat all replicated transaction logs equally and replay the entire transaction logs with the same priority which does not take consideration into the OLAP query access pattern. This design can result in increased response latency for real-time applications. This paper presents AETS, an Adaptive Epoch-based Two-Stage log replay framework that implements epoch-based log replay and table group transaction commit. Simultaneously, AETS also takes full account of the table access priority in real-time HTAP workload log replay. It aims to make the data required by analytical queries visible more quickly. Furthermore, AETS includes a two-phase parallel log replay algorithm called TPLR, which achieves lower overhead compared to state-of-the-art algorithms through careful design. We also offer an adaptive fine-grained thread resource allocation method that considers changes in table access patterns over time under thread resource constraints. Our experimental results show that AETS significantly reduces visibility delay for real-time queries. And the results also show that AETS achieves significant replay throughput improvement.},
}