@inproceedings{3dbc8dc48c7349249c1460ea4bdf8da0,
title = "Crowd IQ: Measuring the intelligence of crowdsourcing platforms",
abstract = "We measure crowdsourcing performance based on a standard IQ questionnaire, and examine Amazon's Mechanical Turk (AMT) performance under different conditions. These include variations of the payment amount offered, the way incorrect responses affect workers' reputations, threshold reputation scores of participating AMT workers, and the number of workers per task. We show that crowds composed of workers of high reputation achieve higher performance than low reputation crowds, and the effect of the amount of payment is non-monotone-both paying too much and too little affects performance. Furthermore, higher performance is achieved when the task is designed such that incorrect responses can decrease workers' reputation scores. Using majority vote to aggregate multiple responses to the same task can significantly improve performance, which can be further boosted by dynamically allocating workers to tasks in order to break ties.",
keywords = "Crowdsourcing, Incentive schemes, Psychometrics",
author = "Michal Kosinski and Yoram Bachrach and Gjergji Kasneci and Jurgen Van-Gael and Thore Graepel",
year = "2012",
doi = "10.1145/2380718.2380739",
language = "English",
isbn = "9781450312288",
series = "Proceedings of the 4th Annual ACM Web Science Conference, WebSci'12",
publisher = "Association for Computing Machinery",
pages = "151--160",
booktitle = "Proceedings of the 4th Annual ACM Web Science Conference, WebSci'12",
note = "4th Annual ACM Web Science Conference, WebSci 2012 ; Conference date: 22-06-2012 Through 24-06-2012",
}