@inproceedings{f3233af97d6e4e7bba2a46e9e5e1fe2b,
title = "Flexible and adaptive stream join algorithm",
abstract = "Flexibility and self-adaptivity are important to real-time join processing in a parallel shared-nothing environment. Join-Matrix is a high-performance model on distributed stream joins and supports arbitrary join predicates. It can handle data skew perfectly since it randomly routes tuples to cells with each steam corresponding to one side of the matrix. Designing of the partitioning scheme of the matrix is a determining factor to maximize system throughputs under the premise of economizing computing resources. In this paper, we propose a novel flexible and adaptive scheme partitioning algorithm for stream join operator, which ensures high throughput but with economical resource usages by allocating resources on demand. Specifically, a lightweight scheme generator, which requires the sample of each stream volume and processing resource quota of each physical machine, generates a join scheme; then a migration plan generator decides how to migrate data among machines under the consideration of minimizing migration cost while ensuring correctness. Extensive experiments are done on different kind of join workloads and show high competence comparing with baseline systems on benchmark.",
author = "Junhua Fang and Xiaotong Wang and Rong Zhang and Aoying Zhou",
note = "Publisher Copyright: {\textcopyright} Springer International Publishing Switzerland 2016.",
year = "2016",
doi = "10.1007/978-3-319-45817-5\_1",
language = "英语",
isbn = "9783319458168",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "3--16",
editor = "Kyuseok Shim and Kai Zheng and Guanfeng Liu and Feifei Li",
booktitle = "Web Technologies and Applications - 18th Asia-Pacific Web Conference, APWeb 2016, Proceedings",
address = "德国",
}