% Conference paper from IEEE CLUSTER 2013. The citation key is the opaque
% identifier assigned by the exporting system; it is kept unchanged so that
% existing \cite commands continue to resolve.
@inproceedings{a244c9d436be4ddf9497ab19b9c57ecc,
  author    = {Zhao, Xinkui and Yin, Jianwei and Chen, Zuoning and Lu, Xingjian},
  title     = {Distance-Aware Virtual Cluster Performance Optimization: A {Hadoop} Case Study},
  booktitle = {2013 {IEEE} International Conference on Cluster Computing, {CLUSTER} 2013},
  series    = {Proceedings - IEEE International Conference on Cluster Computing, ICCC},
  year      = {2013},
  doi       = {10.1109/CLUSTER.2013.6702618},
  isbn      = {9781479908981},
  language  = {english},
  keywords  = {Hadoop, big data, cloud computing, distance-aware virtual cluster, virtual machine communication},
  abstract  = {Cloud computing and big data are becoming two important developing trends in information technology area. However, data-intensive computing has some challenges to work well on virtual machines in cloud computing for virtualized resource competition and complex network communication. Network becomes one of the most notorious bottlenecks, which highlights strategies to lower communication and transmission cost in virtual cluster. In this paper, we present a novel cluster performance optimization strategy named vClusterOpt. vClusterOpt finds out centralized subgraphs of node graph and choose node with the shortest logical distance as kernel node of the subgraph to reduce inter-machine communication and transmission cost under virtual cluster. To calculate logical distance accurately, we define two kinds of logical distance: Logical Communication Distance(LCD) and Logical Transmission Distance(LTD). VM with the shortest LCD with others is used as the communication kernel node who has the most information communication stress, while VM with the shortest LTD is treated as transmission kernel node who has the most data transmission stress. We choose benchmarks running on Hadoop as the represent of data-intensive computing service to demonstrate effectiveness of our approach. Experiments show that an average of 20\% performance improvement can get by our distance-aware virtual cluster optimization strategy.},
  note      = {15th IEEE International Conference on Cluster Computing, CLUSTER 2013 ; Conference date: 23-09-2013 Through 27-09-2013},
}