% Conference paper from the 2013 IEEE International Congress on Big Data:
% LSH-based duplicate-tweet detection for spotting social spammers.
%
% Maintenance notes:
%   - The citation key looks machine-generated; it is kept unchanged so that
%     existing \cite commands still resolve.
%   - Authors are stored in "Last, First" form so name parsing is unambiguous.
%   - language is an ASCII language name (the exported value was the Chinese
%     word for "English").
%   - There is deliberately no series field: the exported value only repeated
%     booktitle, which makes styles that print series show the title twice.
%   - isbn: the exported value 9780768550060 fails the ISBN-13 check digit;
%     9780769550060 is the one-digit correction that passes.
%     TODO: confirm against the publisher record.
@inproceedings{f29d335c086d4003940225b1af680188,
  author    = {Zhang, Qunyan and Ma, Haixin and Qian, Weining and Zhou, Aoying},
  title     = {Duplicate detection for identifying social spam in microblogs},
  booktitle = {Proceedings - 2013 IEEE International Congress on Big Data, BigData 2013},
  pages     = {141--148},
  year      = 2013,
  doi       = {10.1109/BigData.Congress.2013.27},
  isbn      = {9780769550060},
  language  = {english},
  keywords  = {MapReduce, duplicate detection, locality-sensitive hash, microblog, social spam},
  abstract  = {As an important kind of social media, microblog has become an important source of opinion mining and collective behavior study. However, social spams may affect the analytical results greatly. This paper focuses on the problem of identifying potential social spammers who copy pieces of information from others. An improved locality-sensitive hashing based method is used for detecting duplicated tweets. Intensive empirical study over a real-life microblog dataset crawled from Sina Weibo, one of the most popular microblogging services, is conducted. The characteristics of potential spammers and their behaviors are analyzed.},
  note      = {2013 IEEE International Congress on Big Data, BigData 2013 ; Conference date: 27-06-2013 Through 02-07-2013},
}