% Workshop paper in the DASFAA 2010 International Workshops proceedings (LNCS series).
% Cleaned-up repository export: names are in "Last, First" form, acronyms in the
% title are brace-protected against style recasing, the DOI is stored bare (no
% LaTeX escapes), and the language is given as an ASCII identifier.
% TODO(review): the record has no publisher or LNCS volume number; add them
% after verifying against the publisher's page.
@inproceedings{c76c58fc666b4ac6bb3598ebcbb927e6,
  author    = {Zhang, Chenjing and Ma, Qiang and Wang, Xiaoling and Zhou, Aoying},
  title     = {Distributed {SLCA}-Based {XML} Keyword Search by Map-Reduce},
  booktitle = {Database Systems for Advanced Applications - 15th International Conference, DASFAA 2010, International Workshops},
  series    = {Lecture Notes in Computer Science},
  pages     = {386--397},
  year      = {2010},
  doi       = {10.1007/978-3-642-14589-6_40},
  isbn      = {3642145884},
  language  = {english},
  keywords  = {SLCA, XML, distributed system, keyword search},
  abstract  = {Large scales of XML information comes continually from new Web applications, and SLCA (Smallest Lowest Common Ancestor)-based XML keyword search is one of the most important information retrieval approaches. Previous approaches focus on building index for XML documents. However in information dissemination scenario, it is impossible to build index in advance for continuous XML document streams. This paper addresses SLCA-based keyword search for continuous XML documents by Map-Reduce mechanism. We use parallel algorithms to process plenty of XML documents in Hadoop environment. A distributed SLCA computation method is designed, where each net node computes SLCA independently and just a little information needs be transmitted. A real Hadoop environment is built and we demonstrate the efficiency of our algorithms analytically and experimentally.},
  note      = {15th International Conference on Database Systems for Advanced Applications, DASFAA 2010 ; Conference date: 01-04-2010 Through 04-04-2010},
}