@inproceedings{5b3f73455a824681b8202c9d3b6a1fe1,
title = "Filtering with the crowd: Crowdscreen revisited",
abstract = "Filtering a set of items, based on a set of properties that can be verified by humans, is a common application of CrowdSourcing. When the workers are error-prone, each item is presented to multiple users, to limit the probability of misclassification. Since the Crowd is a relatively expensive resource, minimizing the number of questions per item may naturally result in big savings. Several algorithms to address this minimization problem have been presented in the CrowdScreen framework by Parameswaran et al. However, those algorithms do not scale well and therefore cannot be used in scenarios where high accuracy is required in spite of high user error rates. The goal of this paper is thus to devise algorithms that can cope with such situations. To achieve this, we provide new theoretical insights to the problem, then use them to develop a new efficient algorithm. We also propose novel optimizations for the algorithms of CrowdScreen that improve their scalability. We complement our theoretical study by an experimental evaluation of the algorithms on a large set of synthetic parameters as well as real-life crowdsourcing scenarios, demonstrating the advantages of our solution.",
keywords = "Algorithms, CrowdSourcing, Filtering, Hypothesis Testing, Sprt",
author = "Beno{\^i}t Groz and Ezra Levin and Isaac Meilijson and Tova Milo",
note = "Publisher Copyright: {\textcopyright}2016 Beno{\^i}t Groz, Ezra Levin, Isaac Meilijson, and Tova Milo.; null ; Conference date: 15-03-2016 Through 18-03-2016",
year = "2016",
month = mar,
day = "1",
doi = "10.4230/LIPIcs.ICDT.2016.12",
language = "אנגלית",
series = "Leibniz International Proceedings in Informatics, LIPIcs",
publisher = "Schloss Dagstuhl- Leibniz-Zentrum fur Informatik GmbH, Dagstuhl Publishing",
editor = "Thomas Zeume and Wim Martens",
booktitle = "19th International Conference on Database Theory, ICDT 2016",
}