% Conference paper from the WAIM 2014 proceedings (pages 448--452).
% The citation key is an exporter-generated identifier and is kept unchanged
% so that existing citations continue to resolve.
% NOTE(review): `address` holds a country name as exported; BibTeX convention
% is the publisher's city -- confirm and replace if known.
% NOTE(review): no `volume` (series number) was present in the export -- add
% it once verified against the publisher record.
@inproceedings{739b46ff492444f083991069ccc8d587,
  author    = {Feng, Jianhong and Feng, Jianhua and Hu, Huiqi},
  title     = {Leveraging attributes and crowdsourcing for join},
  booktitle = {Web-Age Information Management - 15th International Conference, {WAIM} 2014, Proceedings},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer Verlag},
  address   = {Germany},
  year      = {2014},
  pages     = {448--452},
  doi       = {10.1007/978-3-319-08010-9_47},
  isbn      = {9783319080093},
  language  = {english},
  note      = {15th International Conference on Web-Age Information Management, WAIM 2014 ; Conference date: 16-06-2014 Through 18-06-2014},
  abstract  = {Join operation is usually hard to achieve high quality with machine alone. We adopt crowdsourcing to improve the quality of join. Depending on the number of generated pairs, the overall cost can be expensive for hiring workers to do the verification. We propose a hybrid approach to generate pairs by leveraging attributes, which combines category, sorting and clustering techniques, called CSCER. We also propose an adaptive attribute-selection strategy to efficiently generate pairs based on attributes. Experiments on a real crowdsourcing platform using real datasets indicate that our approaches save the overall cost compared to existing methods and achieve high quality of join results.},
}