CINXE.COM
Mechanical Turk: Now with 40.92% spam. - A Computer Scientist in a Business School
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> <html dir="ltr" xmlns="http://www.w3.org/1999/xhtml" xmlns:b="http://www.google.com/2005/gml/b" xmlns:data="http://www.google.com/2005/gml/data" xmlns:expr="http://www.google.com/2005/gml/expr"> <head><script type="text/javascript" src="https://web-static.archive.org/_static/js/bundle-playback.js?v=7YQSqjSh" charset="utf-8"></script> <script type="text/javascript" src="https://web-static.archive.org/_static/js/wombat.js?v=txqj7nKC" charset="utf-8"></script> <script>window.RufflePlayer=window.RufflePlayer||{};window.RufflePlayer.config={"autoplay":"on","unmuteOverlay":"hidden"};</script> <script type="text/javascript" src="https://web-static.archive.org/_static/js/ruffle/ruffle.js"></script> <script type="text/javascript"> __wm.init("https://web.archive.org/web"); __wm.wombat("http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html","20101229083934","https://web.archive.org/","web","https://web-static.archive.org/_static/", "1293611974"); </script> <link rel="stylesheet" type="text/css" href="https://web-static.archive.org/_static/css/banner-styles.css?v=p7PEIJWi" /> <link rel="stylesheet" type="text/css" href="https://web-static.archive.org/_static/css/iconochive.css?v=3PDvdIFv" /> <!-- End Wayback Rewrite JS Include --> <meta content="KYOVwFLhv8faPO87h6QtiFWYqf7oEerv/1lt4haDxMk=" name="verify-v1"/> <meta content="text/html; charset=UTF-8" http-equiv="Content-Type"/> <script type="text/javascript">(function() { var a=window;function c(b){this.t={};this.tick=function(d,i,e){e=e?e:(new Date).getTime();this.t[d]=[e,i]};this.tick("start",null,b)}var f=new c;a.jstiming={Timer:c,load:f};try{var g=null;if(a.chrome&&a.chrome.csi)g=Math.floor(a.chrome.csi().pageT);if(g==null)if(a.gtbExternal)g=a.gtbExternal.pageT();if(g==null)if(a.external)g=a.external.pageT;if(g)a.jstiming.pt=g}catch(h){};a.tickAboveFold=function(b){b=b;var 
d=0;if(b.offsetParent){do d+=b.offsetTop;while(b=b.offsetParent)}b=d;b<=750&&a.jstiming.load.tick("aft")};var j=false;function k(){if(!j){j=true;a.jstiming.load.tick("firstScrollTime")}}a.addEventListener?a.addEventListener("scroll",k,false):a.attachEvent("onscroll",k); })();</script> <meta content="true" name="MSSmartTagsPreventParsing"/> <meta content="blogger" name="generator"/> <link href="https://web.archive.org/web/20101229083934im_/http://www.blogger.com/favicon.ico" rel="icon" type="image/vnd.microsoft.icon"/> <link href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html" rel="canonical"/> <link rel="alternate" type="application/atom+xml" title="A Computer Scientist in a Business School - Atom" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/feeds/posts/default"/> <link rel="alternate" type="application/rss+xml" title="A Computer Scientist in a Business School - RSS" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/feeds/posts/default?alt=rss"/> <link rel="service.post" type="application/atom+xml" title="A Computer Scientist in a Business School - Atom" href="http://www.blogger.com/feeds/7118563403027467631/posts/default"/> <link rel="EditURI" type="application/rsd+xml" title="RSD" href="http://www.blogger.com/rsd.g?blogID=7118563403027467631"/> <link rel="alternate" type="application/atom+xml" title="A Computer Scientist in a Business School - Atom" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/feeds/2428602678035046823/comments/default"/> <link rel="image_src" href="https://web.archive.org/web/20101229083934im_/http://2.bp.blogspot.com/_skxW9kDLt_c/TQpWpze7-VI/AAAAAAAAfn0/02yFP0s79eQ/s72-c/spam-vs-notspam.PNG"/> <!--[if IE]> <script> (function() { var html5 = ("abbr,article,aside,audio,canvas,datalist,details," + 
"figure,footer,header,hgroup,mark,menu,meter,nav,output," + "progress,section,time,video").split(','); for (var i = 0; i < html5.length; i++) { document.createElement(html5[i]); } })(); </script> <![endif]--> <title>Mechanical Turk: Now with 40.92% spam. - A Computer Scientist in a Business School</title> <link type="text/css" rel="stylesheet" href="https://web.archive.org/web/20101229083934cs_/http://www.blogger.com/static/v1/widgets/1743847221-widget_css_bundle.css"/> <link rel="stylesheet" type="text/css" href="https://web.archive.org/web/20101229083934cs_/http://www.blogger.com/dyn-css/authorization.css?targetBlogID=7118563403027467631&zx=7e79aab4-3ca6-466b-8dcf-11a4ec63181e"/> <style type="text/css">#navbar-iframe { display:block } </style> <style id="page-skin-1" type="text/css"><!-- /* ----------------------------------------------- Blogger Template Style Name: Thisaway Date: 29 Feb 2004 Updated by: Blogger Team ----------------------------------------------- */ /* Variable definitions ==================== <Variable name="textColor" description="Text Color" type="color" default="#634320"> <Variable name="blogTitleColor" description="Blog Title Color" type="color" default="#fef6ee"> <Variable name="blogDescriptionColor" description="Blog Description Color" type="color" default="#fef6ee"> <Variable name="postTitleColor" description="Post Title Color" type="color" default="#ba8247"> <Variable name="dateHeaderColor" description="Date Header Color" type="color" default="#c8ab8f"> <Variable name="sidebarHeaderColor" description="Sidebar Title Color" type="color" default="#bd9e80"> <Variable name="mainLinkColor" description="Link Color" type="color" default="#bf4e27"> <Variable name="mainVisitedLinkColor" description="Visited Link Color" type="color" default="#8f3213"> <Variable name="sidebarLinkColor" description="Sidebar Link Color" type="color" default="#e2a059"> <Variable name="sidebarVisitedLinkColor" description="Sidebar Visited Link Color" type="color" 
default="#ba742a"> <Variable name="bodyFont" description="Text Font" type="font" default="normal normal 100% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif"> <Variable name="headerFont" description="Sidebar Title Font" type="font" default="normal bold 100% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif"> <Variable name="pageTitleFont" description="Blog Title Font" type="font" default="normal bold 200% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif"> <Variable name="blogDescriptionFont" description="Blog Description Font" type="font" default="normal normal 80% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif"> <Variable name="startSide" description="Start side in blog language" type="automatic" default="left"> <Variable name="endSide" description="End side in blog language" type="automatic" default="right"> */ /* global ----------------------------------------------- */ body { margin: 0; text-align: center; min-width: 760px; background: #ce8b43 url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_body.gif) repeat-x left top; color: #634320; font-size: small; } blockquote { margin: 0; padding-top: 0; padding-right: 10px; padding-bottom: 0; padding-left: 10px; border-left: 6px solid #f7e8d8; border-right: 6px solid #f7e8d8; color: #ba8247; } code { color: #ba8247; } hr { display: none; } /* layout ----------------------------------------------- */ #outer-wrapper { margin: 0 auto; width: 760px; text-align: left; font: normal normal 100% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif; } #header-wrapper { padding-bottom: 15px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_header_bottom.gif) no-repeat left bottom; } #header { background: #634320 url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_header.gif) repeat-x left bottom; } #content-wrapper { position: relative; width: 760px; background: #f7f0e9 
url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_main_wrapper.gif) repeat-y left top; } #main-wrapper { display: inline; /* fixes a strange ie margin bug */ float: left; margin-top: 0; margin-right: 0; margin-bottom: 0; margin-left: 3px; padding: 0; width: 483px; word-wrap: break-word; /* fix for long text breaking sidebar float in IE */ overflow: hidden; /* fix for long non-text content breaking IE sidebar float */ } #main { padding-top: 22px; padding-right: 8px; padding-bottom: 0; padding-left: 8px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_content.gif) repeat-x left top; } .post { margin-top: 0; margin-right: 8px; margin-bottom: 14px; margin-left: 21px; padding: 0; border-bottom: 3px solid #f7e8d8; } #comments { margin-top: 0; margin-right: 16px; margin-bottom: 14px; margin-left: 29px; padding: 10px; border: 1px solid #f0e0ce; background-color: #f5ede4; } #sidebar-wrapper { display: inline; /* fixes a strange ie margin bug */ float: right; margin-top: 0; margin-right: 3px; margin-bottom: 0; margin-left: 0; width: 269px; color: #634320; line-height: 1.4em; font-size: 90%; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_sidebar.gif) repeat-x left top; word-wrap: break-word; /* fix for long text breaking sidebar float in IE */ overflow: hidden; /* fix for long non-text content breaking IE sidebar float */ } #sidebar { padding-top: 7px; padding-right: 11px; padding-bottom: 0; padding-left: 14px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_sidebar_arrow.gif) repeat-y 179px 0; } #sidebar .widget { margin-bottom: 20px; } #footer-wrapper { padding-top: 15px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_footer_top.gif) no-repeat left top; clear: both; } #footer { background: #493015 
url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_footer.gif) repeat-x left top; text-align: center; min-height: 2em; } /* headings ----------------------------------------------- */ #header h1 { margin: 0; padding-top: 24px; padding-right: 0; padding-bottom: 0; padding-left: 84px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_header_left.gif) no-repeat 16px 26px; } h2.date-header { margin: 0; padding-top: 0; padding-right: 0; padding-bottom: 0; padding-left: 29px; text-transform: uppercase; color: #c8ab8f; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_date.gif) no-repeat 13px 0; font-size: 80%; font-weight: normal; } .date-header span { margin-top: 0; margin-right: 0; margin-bottom: 0; margin-left: 5px; padding-top: 0; padding-right: 25px; padding-bottom: 0; padding-left: 25px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/bg_date.gif) no-repeat left 0; } .sidebar h2 { padding-top: 1px; padding-right: 0; padding-bottom: 0; padding-left: 36px; color: #bd9e80; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_sidebar_heading_left.gif) no-repeat left 45%; font: normal bold 100% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif; } .sidebar .Profile h2 { color: #957252; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_sidebar_profileheading_left.gif) no-repeat left 45%; } .post h3 { margin-top: 13px; margin-right: 0; margin-bottom: 13px; margin-left: 0; padding: 0; color: #ba8247; font-size: 140%; } .post h3 a, .post h3 a:visited { color: #ba8247; } #comments h4 { margin-top: 0; font-size: 120%; } /* text ----------------------------------------------- */ #header h1 { color: #fef6ee; font: normal bold 200% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif; } #header .description 
{ margin: 0; padding-top: 7px; padding-right: 16px; padding-bottom: 0; padding-left: 84px; color: #fef6ee; font: normal normal 80% Helvetica,Arial,Verdana,'Trebuchet MS', Sans-serif; } .post-body p { line-height: 1.4em; /* Fix bug in IE5/Win with italics in posts */ margin: 0; height: 1%; overflow: visible; } .post-footer { font-size: 80%; color: #c8ab8f; } .uncustomized-post-template .post-footer { text-align: right; } .uncustomized-post-template .post-footer .post-author, .uncustomized-post-template .post-footer .post-timestamp { display: block; float: left; text-align: left; margin-right: 4px; } p.comment-author { font-size: 83%; } .deleted-comment { font-style:italic; color:gray; } .comment-body p { line-height: 1.4em; } .feed-links { clear: both; line-height: 2.5em; margin-bottom: 0.5em; margin-left: 29px; } #footer .widget { margin: 0; padding-top: 0; padding-right: 0; padding-bottom: 15px; padding-left: 55px; color: #fef6ee; font-size: 90%; line-height: 1.4em; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_footer.gif) no-repeat 16px 0; } /* lists ----------------------------------------------- */ .post ul { padding-left: 32px; list-style-type: none; line-height: 1.4em; } .post li { padding-top: 0; padding-right: 0; padding-bottom: 4px; padding-left: 17px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_list_item_left.gif) no-repeat left 3px; } #comments ul { margin: 0; padding: 0; list-style-type: none; } #comments li { padding-top: 0; padding-right: 0; padding-bottom: 1px; padding-left: 17px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_comment_left.gif) no-repeat left 3px; } .sidebar ul { padding: 0; list-style-type: none; line-height: 1.2em; margin-left: 0; } .sidebar li { padding-top: 0; padding-right: 0; padding-bottom: 4px; padding-left: 17px; background: 
url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_list_item.gif) no-repeat left 3px; } #blog-pager-newer-link { float: left; margin-left: 29px; } #blog-pager-older-link { float: right; margin-right: 16px; } #blog-pager { text-align: center; } /* links ----------------------------------------------- */ a { color: #bf4e27; font-weight: bold; } a:hover { color: #8f3213; } a.comment-link { /* ie5.0/win doesn't apply padding to inline elements, so we hide these two declarations from it */ background/* */:/**/url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_comment_left.gif) no-repeat left 45%; padding-left: 14px; } html>body a.comment-link { /* respecified, for ie5/mac's benefit */ background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway/icon_comment_left.gif) no-repeat left 45%; padding-left: 14px; } .sidebar a { color: #e2a059; } .sidebar a:hover { color: #ba742a; } #header h1 a { color: #fef6ee; text-decoration: none; } #header h1 a:hover { color: #d9c6b4; } .post h3 a { text-decoration: none; } a img { border-width: 0; } .clear { clear: both; line-height: 0; height: 0; } .profile-textblock { clear: both; margin-bottom: 10px; margin-left: 0; } .profile-img { float: left; margin-top: 0; margin-right: 5px; margin-bottom: 5px; margin-left: 0; padding: 3px; border: 1px solid #ebd4bd; } .profile-link { padding-top: 0; padding-right: 0; padding-bottom: 0; padding-left: 17px; background: url(https://web.archive.org/web/20101229083934im_/http://www.blogblog.com/thisaway_blue/icon_profile_left.gif) no-repeat left 0; } /** Page structure tweaks for layout editor wireframe */ body#layout #main, body#layout #sidebar { padding: 0; } --></style> <script type="text/javascript"> var _gaq = _gaq || []; _gaq.push(['_setAccount', 'UA-89122-10']); _gaq.push(['_trackPageview']); (function() { var ga = document.createElement('script'); ga.src = ('https:' == 
document.location.protocol ? 'https://web.archive.org/web/20101229083934/https://ssl' : 'https://web.archive.org/web/20101229083934/http://www') + '.google-analytics.com/ga.js'; ga.setAttribute('async', 'true'); document.documentElement.firstChild.appendChild(ga); })(); </script> <script type="text/javascript"> if (window.jstiming) window.jstiming.load.tick('headEnd'); </script></head> <body> <div class="navbar section" id="navbar"><div class="widget Navbar" id="Navbar1"><script type="text/javascript"> function setAttributeOnload(object, attribute, val) { if(window.addEventListener) { window.addEventListener("load", function(){ object[attribute] = val; }, false); } else { window.attachEvent('onload', function(){ object[attribute] = val; }); } } </script> <iframe src="https://web.archive.org/web/20101229083934if_/http://www.blogger.com/navbar.g?targetBlogID=7118563403027467631&blogName=A+Computer+Scientist+in+a+Business+Sc...&publishMode=PUBLISH_MODE_BLOGSPOT&navbarType=SILVER&layoutType=LAYOUTS&searchRoot=http%3A%2F%2Fbehind-the-enemy-lines.blogspot.com%2Fsearch&blogLocale=en_US&homepageUrl=http%3A%2F%2Fbehind-the-enemy-lines.blogspot.com%2F&targetPostID=2428602678035046823" marginwidth="0" marginheight="0" scrolling="no" frameborder="0" height="30px" width="100%" id="navbar-iframe" allowtransparency="true" title="Blogger Navigation and Search"></iframe> <div></div></div></div> <div id="outer-wrapper"><div id="wrap2"> <!-- skip links for text browsers --> <span id="skiplinks" style="display:none;"> <a href="#main">skip to main </a> | <a href="#sidebar">skip to sidebar</a> </span> <div id="header-wrapper"> <div class="header section" id="header"><div class="widget Header" id="Header1"> <div id="header-inner"> <div class="titlewrapper"> <h1 class="title"> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/">A Computer Scientist in a Business School</a> </h1> </div> <div class="descriptionwrapper"> <p 
class="description"><span>Thoughts and stories of a computer scientist in a business school.</span></p> </div> </div> </div></div> </div> <div id="content-wrapper"> <div id="crosscol-wrapper" style="text-align:center"> <div class="crosscol section" id="crosscol"></div> </div> <div id="main-wrapper"> <div class="main section" id="main"><div class="widget Blog" id="Blog2"> <div class="blog-posts hfeed"> <!-- google_ad_section_start(name=default) --> <div class="date-outer"> <h2 class="date-header"><span>Thursday, December 16, 2010</span></h2> <div class="date-posts"> <div class="post-outer"> <div class="post"> <a name="2428602678035046823"></a> <h3 class="post-title"> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html">Mechanical Turk: Now with 40.92% spam.</a> </h3> <div class="post-header-line-1"></div> <div class="post-body"> <p>At this point, <a href="https://web.archive.org/web/20101229083934/https://www.mturk.com/mturk/findhits?match=false">Amazon Mechanical Turk</a> has reached the mainstream. Pretty much everyone knows about the concept. Post small tasks online, pay people cents, and get thousands of micro-tasks completed.<br/> <br/> Unfortunately, this has led to some troubling trends. Anyone who frequents the market even a little will notice the tremendous number of spammy HITs. (HIT = a task posted for completion in the market; stands for Human Intelligence Task). "Test if the ads in my website work". "Create a Twitter account and follow me". "Like my YouTube video". "Download this app". "Write a positive review on Yelp". 
A seemingly endless amount of spam HITs come to the market, mainly with the purpose of spamming "social media" metrics.<br/> <hr align="center" style="background-color: #691f01; border: 1px; color: #691f01; display: block; height: 2px;" width="50%"/><br/> So, with <a href="https://web.archive.org/web/20101229083934/http://dahn.tamir.com/">Dahn Tamir</a> and <a href="https://web.archive.org/web/20101229083934/http://www.linkedin.com/in/priyakanth">Priya Kanth</a> (MS student at NYU), we decided to examine how big the problem is. How many spammers join the market? How many spam HITs are there?<br/> <br/> Using the data from <a href="https://web.archive.org/web/20101229083934/http://www.mturk-tracker.com/general/">Mechanical Turk Tracker</a>, we picked all the requesters that first joined the market in September 2010 and October 2010. Why new ones? Because we assumed that long-term requesters are not spammers. (But this remains to be verified.)<br/> <br/> This process resulted in 1733 new requesters that first appeared in the marketplace in September and October 2010. We then took all the HITs that these requesters posted in the market. This was a total of 5842 HIT groups. The activity patterns of the new requesters were similar to those of the general requester population.<br/> <br/> <hr align="center" style="background-color: #691f01; border: 1px; color: #691f01; display: block; height: 2px;" width="50%"/><br/> The next step was to post these HITs on Mechanical Turk, and ask workers to classify them as spam or not, using the following guidelines:<br/> <br/> <table border="1"><tbody> <tr><td><blockquote><br/> Use the following guidelines to classify the HIT as SPAM: <br/> <ul><li><b>SEO</b>: Asks me to give a fake rating, vote, review, comment, or "like" on Facebook, YouTube, DIGG, etc., or to create fake mail or website accounts.</li> <li><b>Fake accounts</b>: Asks me to create an account on Twitter, Facebook, and then perform a likely spam action. 
</li> <li><b>Lead Gen</b>: Asks me to go to a website and sign up for a trial, complete an offer, fill out a form requesting information, "test" a data-entry form, etc.</li> <li><b>Fake clicks</b>: Asks me to go to a website and click on ads.</li> <li><b>Fake ads</b>: Asks me to post an ad to Craigslist or other marketplace.</li> <li><b>Personal Info</b>: Asks me for my real name, phone number, full mailing address or email.</li> <li>You can also use your intuition to classify the HIT</li> </ul>Please DO NOT classify as spam, HITs that are legitimate in nature but priced offensively low.</blockquote></td></tr> </tbody></table><br/> Interestingly enough, we got a ridiculous amount of spam from the worker side. Even with a 99% approval rate and 1000 HITs as qualification, we got plenty of spammers giving us random data.<br/> <br/> Since spam was a big problem, we posted the HIT using CrowdFlower and we used a set of 100 manually classified HITs as gold. (Without CrowdFlower, we had to manually kick out the spammers and repost the HITs. So, CrowdFlower saved the day.)<br/> <br/> We asked 11 workers to classify each HIT, and we ignored votes from the untrusted workers (those who failed to answer at least 75% of the gold tests correctly). So, with 11 trusted workers working on each HIT, we were reasonably sure that the majority vote across these 11 votes resulted in an accurate HIT classification.<br/> <br/> I also ran the "<a href="https://web.archive.org/web/20101229083934/http://code.google.com/p/get-another-label/">get another label</a>" code and I noticed that all the workers were of reasonable quality. Since the results were similar to those of the majority vote, I decided to keep things simple and go with the majority vote as the correct answer.<br/> <br/> <hr align="center" style="background-color: #691f01; border: 1px; color: #691f01; display: block; height: 2px;" width="50%"/><br/> <b>The results</b><br/> <br/> The results were disturbing. 
<b>Out of the total of 5841 HITs, a total of 2390 HITs, or 40.92%, were marked as spam HITs.</b><br/> <b><br/> </b><br/> <div class="separator" style="clear: both; text-align: center;"><a href="https://web.archive.org/web/20101229083934/http://2.bp.blogspot.com/_skxW9kDLt_c/TQpWpze7-VI/AAAAAAAAfn0/02yFP0s79eQ/s1600/spam-vs-notspam.PNG" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"><img border="0" src="https://web.archive.org/web/20101229083934im_/http://2.bp.blogspot.com/_skxW9kDLt_c/TQpWpze7-VI/AAAAAAAAfn0/02yFP0s79eQ/s1600/spam-vs-notspam.PNG"/></a></div><b><br/> </b><br/> This is not good! 40% of the HITs from new requesters are spam!<br/> <br/> Our next test was to examine whether there are accounts that post a mix of spam and not spam HITs. The analysis indicated that this is not the case. Very few accounts post both spam HITs and legitimate HITs:<br/> <br/> <div class="separator" style="clear: both; text-align: center;"><a href="https://web.archive.org/web/20101229083934/http://3.bp.blogspot.com/_skxW9kDLt_c/TQmaiAORwnI/AAAAAAAAfnI/jo5vgvXRT04/s1600/spam-percentage-per-requester.PNG" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"><img border="0" height="267" src="https://web.archive.org/web/20101229083934im_/http://3.bp.blogspot.com/_skxW9kDLt_c/TQmaiAORwnI/AAAAAAAAfnI/jo5vgvXRT04/s400/spam-percentage-per-requester.PNG" width="400"/></a></div><div class="separator" style="clear: both; text-align: center;"><br/> </div><div class="separator" style="clear: both; text-align: center;"><br/> </div>The plot illustrates that <b>31.83% of the new requesters post only spam HITs</b>.<br/> <br/> In total, 757 out of the 1733 new requesters posted at least one spam HIT, and 552 accounts were posting only spam HITs. 56.46% of the new requesters post no spam HITs. This nice separation indicates that it is easy to separate spam requesters from legitimate ones. 
There are not that many requesters that post both spam HITs and legitimate ones.<br/> <br/> <b>So, 31.8% of the new requesters are clear spammers, and 40.92% of the new HITs are spam-related! </b>This is clearly a problem. <br/> <br/> <hr align="center" style="background-color: #691f01; border: 1px; color: #691f01; display: block; height: 2px;" width="50%"/><br/> <b>Spam HITs and pricing</b><br/> <b><br/> </b><br/> So, what are the quantitative characteristics of the spam HITs?<br/> <br/> First of all, they tend to contain much fewer "HITs available" compared to the legitimate HITs. 95% of the spam HITs contain just a single HIT, while only 75% of the legitimate HITs have one HIT available.<br/> <b><br/> </b><br/> <br/> <div class="separator" style="clear: both; text-align: center;"><a href="https://web.archive.org/web/20101229083934/http://4.bp.blogspot.com/_skxW9kDLt_c/TQqHqcz4FpI/AAAAAAAAfn4/aOjeQqaeaF8/s1600/hits_available_spam_not_spam.PNG" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"><img border="0" height="241" src="https://web.archive.org/web/20101229083934im_/http://4.bp.blogspot.com/_skxW9kDLt_c/TQqHqcz4FpI/AAAAAAAAfn4/aOjeQqaeaF8/s400/hits_available_spam_not_spam.PNG" width="400"/></a></div><br/> <div class="separator" style="clear: both; text-align: center;"><br/> </div>On the other hand, spammers tend to post HITs with higher rewards (perhaps because they do not pay?). Approximately 80% of the legitimate HITs are priced below one dollar, while only 60% of the spam HITs are priced below this threshold. 
Actually, many of the best-paying HITs tend to be spam-related ones.<br/> <br/> <div style="text-align: center;"><a href="https://web.archive.org/web/20101229083934/http://4.bp.blogspot.com/_skxW9kDLt_c/TQqRpWam1qI/AAAAAAAAfn8/9rMKuElheR4/s1600/price_spam_not_spam.PNG" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"><img border="0" height="248" src="https://web.archive.org/web/20101229083934im_/http://4.bp.blogspot.com/_skxW9kDLt_c/TQqRpWam1qI/AAAAAAAAfn8/9rMKuElheR4/s400/price_spam_not_spam.PNG" width="400"/></a></div><div style="text-align: center;"><br/> </div><div style="text-align: left;">By combining the two charts above, we can plot the total value of the spam vs not spam HITs. </div><div class="separator" style="clear: both; text-align: center;"><br/> </div><div class="separator" style="clear: both; text-align: center;"><a href="https://web.archive.org/web/20101229083934/http://3.bp.blogspot.com/_skxW9kDLt_c/TQqWdBnNEgI/AAAAAAAAfoA/8-_jn_yv5MI/s1600/totalvalue_spam_not_spam.PNG" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"><img border="0" height="247" src="https://web.archive.org/web/20101229083934im_/http://3.bp.blogspot.com/_skxW9kDLt_c/TQqWdBnNEgI/AAAAAAAAfoA/8-_jn_yv5MI/s400/totalvalue_spam_not_spam.PNG" width="400"/></a></div><div style="text-align: left;"><br/> </div><div style="text-align: left;"><br/> </div><div style="text-align: left;">Overall, the findings are not really surprising: Most of the spam HITs require a large number of workers to complete a task. They want 1000 users to click an ad, not a single user to click a thousand times on a single ad. Therefore, I suspect that most of these spam HITs have a very significant amount of redundancy (which unfortunately we cannot observe). 
This means that the total value of the posted spam HITs is most probably much higher than the total value of the legitimate HITs.</div><div style="text-align: left;"><br/> <hr align="center" style="background-color: #691f01; border: 1px; color: #691f01; display: block; height: 2px;" width="50%"/><br/> </div><div style="text-align: left;"><b>What to do?</b></div><div style="text-align: left;"><br/> </div><div style="text-align: left;">These trends are very worrisome:</div><div style="text-align: left;"></div><ul><li>40% of the HITs from new requesters are spam. </li> <li>30% of the new requesters are clear spammers.</li> <li>The spam HITs have bigger value than the legitimate ones. </li> </ul><div>It is very clear that active action should be taken against spam requesters. </div><div><br/> </div><div>According to our measurements, we see approximately <a href="https://web.archive.org/web/20101229083934/http://www.mturk-tracker.com/arrivals/">1500 new HITs arriving in the market every day</a> (from all requesters), and approximately 30 new requester accounts join the market every day. It should be trivial to review all the HITs <b>manually by posting them to MTurk for review.</b> </div><div><br/> </div><div><div>But even if this manual inspection is expensive, this is a task that can be very easily automated. In our current work,<b> we realized that it is very easy to accurately classify HITs as spam or not. A simple SVM linear classifier that uses bag of words as features can achieve a <span class="Apple-style-span" style="color: #990000;">95% true positive and 95% true negative rate</span>. 
</b>With a moderately advanced scheme, it should be possible to have a strong system in place pretty quickly.<br/> <br/> For whoever is interested, the data is available here:<br/> <iframe frameborder="0" height="300" src="https://web.archive.org/web/20101229083934if_/https://spreadsheets.google.com/pub?key=0AjX1e06EhsXSdEhHWndZQ21oV0dERUpwVXA1UlFfX3c&hl=en&single=true&gid=0&output=html&widget=true" width="400"></iframe><br/> <br/> </div><div><br/> </div><div>The disheartening part was the response of Amazon when we informed them about the issue. They pretty much assured us that everything was fine, and that they believed there was no problem! For me, this was more problematic than the existence of spam.</div><br/> <hr align="center" style="background-color: #691f01; border: 1px; color: #691f01; display: block; height: 2px;" width="50%"/><br/> <div><b>Why does Amazon ignore spam?</b></div><div><br/> To answer this question, I asked Amazon for access to the data to investigate further. Unfortunately, I was denied access. (It does not pay to <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/plea-to-amazon-fix-mechanical-turk.html">criticize Amazon</a>.) Interestingly enough, the MTurk guys <a href="https://web.archive.org/web/20101229083934/http://www.quora.com/If-you-could-observe-all-transactions-on-the-Amazon-Mechanical-Turk-marketplace-what-would-you-like-to-know">share data with other academics</a>.<br/> <br/> </div><div>The key piece for answering this question, which I cannot get from my data: <b>Do spammers pay the workers?</b> </div></div><div><br/> </div><div>If the spam requesters <b>do not pay</b> the workers, then Amazon <b><i>should </i></b>be more proactive in battling spammer requesters. Workers need to be protected! It is easy to see that it is a death spiral otherwise. The more spammers can get away with getting work done and not paying, the less the workers will trust new requesters. 
Legitimate new requesters will face a significant uphill battle to convince the workers about their intentions, they will abandon their plans, and let the spammers prevail. We have <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/07/mechanical-turk-low-wages-and-market.html">a market for lemons</a> in reverse.</div><div><br/> </div><div>If the spam requesters <b>pay </b>the workers, then there is a cynical explanation: Amazon does not take an active role in cleaning the market because they simply profit from the spam. And it is part of the growth. And nobody within the MTurk division would cut in half the growth rate at this point.<br/> <br/> However, this would be an incredibly short-sighted approach. With the amount of spam on the worker side, and the amount of spam on the requester side, <b><i>Mechanical Turk would slowly turn into a market where spammer requesters talk to spammer workers</i></b>... Ah yes, and academics running experiments...</div></p> <div style="clear: both;"></div> </div> <div class="post-footer"> <script charset="utf-8" src="https://web.archive.org/web/20101229083934js_/http://feeds.feedburner.com/~s/AComputerScientistInABusinessSchool?i=http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html" type="text/javascript"></script> <p class="post-footer-line post-footer-line-1"><span class="post-labels"> Labels: <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/search/label/mechanical%20turk" rel="tag">mechanical turk</a>, <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/search/label/spam" rel="tag">spam</a> </span> </p> <p class="post-footer-line post-footer-line-2"><span class="post-author"> Posted by Panos Ipeirotis </span> <span class="post-timestamp"> at <a class="timestamp-link" 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html" title="permanent link">6:49 PM</a> </span> <span class="post-icons"> <span class="item-action"> <a href="https://web.archive.org/web/20101229083934/http://www.blogger.com/email-post.g?blogID=7118563403027467631&postID=2428602678035046823" title="Email Post"> <span class="email-post-icon"> </span> </a> </span> <span class="item-control blog-admin pid-1469181435"> <a href="https://web.archive.org/web/20101229083934/http://www.blogger.com/post-edit.g?blogID=7118563403027467631&postID=2428602678035046823" title="Edit Post"> <img alt="" class="icon-action" height="18" src="https://web.archive.org/web/20101229083934im_/http://img2.blogblog.com/img/icon18_edit_allbkg.gif" width="18"/> </a> </span> </span> </p> <p class="post-footer-line post-footer-line-3"><span class="post-comment-link"> </span> <span class="post-backlinks post-comment-link"> </span> </p> </div> </div> <div class="comments" id="comments"> <a name="comments"></a> <h4> 0 comments: </h4> <div id="Blog2_comments-block-wrapper"> <dl class="avatar-comment-indent" id="comments-block"> </dl> </div> <p class="comment-footer"> <div class="comment-form"> <a name="comment-form"></a> <h4 id="comment-post-message">Post a Comment</h4> <p> </p> <a href="https://web.archive.org/web/20101229083934/http://www.blogger.com/comment-iframe.g?blogID=7118563403027467631&postID=2428602678035046823" id="comment-editor-src"></a> <iframe allowtransparency="true" class="blogger-iframe-colorize blogger-comment-from-post" frameborder="0" height="410" id="comment-editor" name="comment-editor" src="/web/20101229083934if_/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html" width="100%"></iframe> <script type="text/javascript"> if (!window.google || !google.friendconnect) { document.write('<script type="text/javascript"' + 
' src="https://web.archive.org/web/20101229083934/http://www.google.com/friendconnect/script/friendconnect.js">' + '</scr' + 'ipt>'); } </script> <script type="text/javascript"> if (!window.registeredBloggerCallbacks) { window.registeredBloggerCallbacks = true; gadgets.rpc.register('requestReload', function() { document.location.reload(); }); gadgets.rpc.register('requestSignOut', function(siteId) { google.friendconnect.container.openSocialSiteId = siteId; google.friendconnect.requestSignOut(); }); } </script> <script type="text/javascript">
/*
 * Registers the 'getBlogUrls' handler with gadgets.rpc. When invoked, the
 * handler returns a fresh object carrying the feed URLs, page URLs and IDs
 * of the current post and of the blog.
 */
function registerGetBlogUrls() {
  gadgets.rpc.register('getBlogUrls', function() {
    var holder = {};
    holder.currentPost = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/posts/default/2428602678035046823";
    holder.currentComments = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/2428602678035046823/comments/default";
    holder.currentPostUrl = "";
    // The statement terminator is required here: with the whole script on one
    // line there is no line break for automatic semicolon insertion to use.
    // NOTE(review): this literal is larger than Number.MAX_SAFE_INTEGER, so the
    // parsed number is rounded; it is kept numeric to preserve the type that
    // consumers receive. Confirm whether a string ID would be acceptable.
    holder.currentPostId = 2428602678035046823;
    holder.postFeed = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/posts/default";
    holder.commentFeed = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/comments/default";
    holder.currentBlogUrl = "https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/";
    holder.currentBlogId = "7118563403027467631";
    return holder;
  });
}
</script> <script type="text/javascript"> if (!window.registeredCommonBloggerCallbacks) { window.registeredCommonBloggerCallbacks = true; gadgets.rpc.register('resize_iframe', function(height) { var el = document.getElementById(this['f']); if (el) { el.style.height = height + 'px'; } }); gadgets.rpc.register('set_pref', function() {}); registerGetBlogUrls(); } </script> <script type="text/javascript" 
src="https://web.archive.org/web/20101229083934js_/http://www.blogger.com/static/v1/jsbin/528630121-comment_from_post_iframe.js"></script> <script type="text/javascript"> BLOG_CMT_createIframe('https://web.archive.org/web/20101229083934/http://www.blogger.com/rpc_relay.html', '07711817410234421382'); </script> </div> </p> <div id="backlinks-container"> <div id="Blog2_backlinks-container"> <a name="links"></a><h4> </h4> <p class="comment-footer"> <a class="comment-link" href="" id="Blog2_backlinks-create-link" target="_blank"> </a> </p> </div> </div> </div> </div> <div id="latency-2428602678035046823"></div><script type="text/javascript">if (window['tickAboveFold']) {window['tickAboveFold'](document.getElementById("latency-2428602678035046823")); } </script> </div></div> <!-- google_ad_section_end --> </div> <div class="blog-pager" id="blog-pager"> <span id="blog-pager-newer-link"> <a class="blog-pager-newer-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/amazon-reacts-spammers-kicked-out-of.html" id="Blog2_blog-pager-newer-link" title="Newer Post">Newer Post</a> </span> <span id="blog-pager-older-link"> <a class="blog-pager-older-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/sharing-code-apis-and-readability-api.html" id="Blog2_blog-pager-older-link" title="Older Post">Older Post</a> </span> <a class="home-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/">Home</a> </div> <div class="clear"></div> <div class="post-feeds"> <div class="feed-links"> Subscribe to: <a class="feed-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/feeds/2428602678035046823/comments/default" target="_blank" type="application/atom+xml">Post Comments (Atom)</a> </div> </div> </div></div> </div> <div id="sidebar-wrapper"> <div class="sidebar section" id="sidebar"><div class="widget 
Profile" id="Profile2"> <h2>About Me</h2> <div class="widget-content"> <a href="https://web.archive.org/web/20101229083934/http://www.blogger.com/profile/15283752183704062501"><img alt="My Photo" class="profile-img" height="45" src="https://web.archive.org/web/20101229083934im_/http://1.bp.blogspot.com/_skxW9kDLt_c/SqPtaZyiZUI/AAAAAAAAAjM/8gCSDmi3Ts8/S220/IMG_2684.JPG" width="80"/></a> <dl class="profile-datablock"> <dt class="profile-data">Panos Ipeirotis</dt> <dd class="profile-data">New York, NY, United States</dd> <dd class="profile-textblock">I am an Associate Professor at the IOMS Department at Stern School of Business of New York University. I am interested in crowdsourcing and in leveraging economics to solve computer science problems.</dd> </dl> <a class="profile-link" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/profile/15283752183704062501">View my complete profile</a> <div class="clear"></div> <span class="widget-item-control"> <span class="item-control blog-admin"> <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&widgetType=Profile&widgetId=Profile2&action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('Profile2'));" target="configProfile2" title="Edit"> <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/> </a> </span> </span> <div class="clear"></div> </div> </div><div class="widget HTML" id="HTML2"> <h2 class="title">Subscribe</h2> <div class="widget-content"> <a href="https://web.archive.org/web/20101229083934/http://feeds.feedburner.com/AComputerScientistInABusinessSchool" rel="alternate" type="application/rss+xml"><img alt="" style="vertical-align:middle;border:0" src="https://web.archive.org/web/20101229083934im_/http://www.feedburner.com/fb/images/pub/feed-icon16x16.png"/> </a> <a 
href="https://web.archive.org/web/20101229083934/http://feeds.feedburner.com/AComputerScientistInABusinessSchool" rel="alternate" type="application/rss+xml">Blog Posts</a> <br/> <a href="https://web.archive.org/web/20101229083934/http://feeds.feedburner.com/Comments_AComputerScientistInABusinessSchool" rel="alternate" type="application/rss+xml"><img alt="" style="vertical-align:middle;border:0" src="https://web.archive.org/web/20101229083934im_/http://www.feedburner.com/fb/images/pub/feed-icon16x16.png"/> </a> <a href="https://web.archive.org/web/20101229083934/http://feeds.feedburner.com/Comments_AComputerScientistInABusinessSchool" rel="alternate" type="application/rss+xml">Blog Comments</a> <br/> <a href="https://web.archive.org/web/20101229083934/http://feedburner.google.com/fb/a/mailverify?uri=AComputerScientistInABusinessSchool&loc=en_US"><img alt="" style="vertical-align:middle;border:0" src="https://web.archive.org/web/20101229083934im_/http://pages.stern.nyu.edu/~panos/blog/email.jpg"/></a> <a href="https://web.archive.org/web/20101229083934/http://feedburner.google.com/fb/a/mailverify?uri=AComputerScientistInABusinessSchool&loc=en_US">Subscribe by Email</a> </div> <div class="clear"></div> <span class="widget-item-control"> <span class="item-control blog-admin"> <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&widgetType=HTML&widgetId=HTML2&action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('HTML2'));" target="configHTML2" title="Edit"> <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/> </a> </span> </span> <div class="clear"></div> </div><div class="widget Gadget" id="Gadget2"> <h2 class="title">Twitter Updates</h2> <script type="text/javascript"> if (!window.google || !google.friendconnect) { document.write('<script type="text/javascript"' + 
' src="https://web.archive.org/web/20101229083934/http://www.google.com/friendconnect/script/friendconnect.js">' + '</scr' + 'ipt>'); } </script> <script type="text/javascript"> if (!window.registeredBloggerCallbacks) { window.registeredBloggerCallbacks = true; gadgets.rpc.register('requestReload', function() { document.location.reload(); }); gadgets.rpc.register('requestSignOut', function(siteId) { google.friendconnect.container.openSocialSiteId = siteId; google.friendconnect.requestSignOut(); }); } </script> <script type="text/javascript">
/*
 * Registers the 'getBlogUrls' handler with gadgets.rpc. When invoked, the
 * handler returns a fresh object carrying the feed URLs, page URLs and IDs
 * of the current post and of the blog.
 */
function registerGetBlogUrls() {
  gadgets.rpc.register('getBlogUrls', function() {
    var holder = {};
    holder.currentPost = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/posts/default/2428602678035046823";
    holder.currentComments = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/2428602678035046823/comments/default";
    holder.currentPostUrl = "";
    // The statement terminator is required here: with the whole script on one
    // line there is no line break for automatic semicolon insertion to use.
    // NOTE(review): this literal is larger than Number.MAX_SAFE_INTEGER, so the
    // parsed number is rounded; it is kept numeric to preserve the type that
    // consumers receive. Confirm whether a string ID would be acceptable.
    holder.currentPostId = 2428602678035046823;
    holder.postFeed = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/posts/default";
    holder.commentFeed = "https://web.archive.org/web/20101229083934/http://www.blogger.com/feeds/7118563403027467631/comments/default";
    holder.currentBlogUrl = "https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/";
    holder.currentBlogId = "7118563403027467631";
    return holder;
  });
}
</script> <script type="text/javascript"> if (!window.registeredCommonBloggerCallbacks) { window.registeredCommonBloggerCallbacks = true; gadgets.rpc.register('resize_iframe', function(height) { var el = document.getElementById(this['f']); if (el) { el.style.height = height + 'px'; } }); gadgets.rpc.register('set_pref', function() {}); registerGetBlogUrls(); } </script> <div id="div-re0sypq5cp8p" style="width: 100%; "></div> <script type="text/javascript"> var skin = {}; skin['FACE_SIZE'] = '32'; skin['HEIGHT'] = "200"; 
skin['TITLE'] = "Twitter Updates"; skin['BORDER_COLOR'] = "transparent"; skin['ENDCAP_BG_COLOR'] = "transparent"; skin['ENDCAP_TEXT_COLOR'] = "#634320"; skin['ENDCAP_LINK_COLOR'] = "#e2a059"; skin['ALTERNATE_BG_COLOR'] = "transparent"; skin['CONTENT_BG_COLOR'] = "transparent"; skin['CONTENT_LINK_COLOR'] = "#e2a059"; skin['CONTENT_TEXT_COLOR'] = "#634320"; skin['CONTENT_SECONDARY_LINK_COLOR'] = "#e2a059"; skin['CONTENT_SECONDARY_TEXT_COLOR'] = "#000000"; skin['CONTENT_HEADLINE_COLOR'] = "#000000"; skin['FONT_FACE'] = "normal normal 100% Helvetica,Arial,Verdana,\x27Trebuchet MS\x27, Sans-serif"; google.friendconnect.container.setParentUrl("/"); google.friendconnect.container["renderOpenSocialGadget"]( {id: "div-re0sypq5cp8p", height: 200, url: "https://web.archive.org/web/20101229083934/http://gadgetsforblogger.googlecode.com/files/twitter-gadget-v1-3.xml", "view-params": {"displayLink":true,"myUsername":"ipeirotis","myUpdates":"5"}, "prefs": {"displayLink":"1","myUsername":"ipeirotis","myUpdates":"5"}, site: "07711817410234421382", locale: 'en_US' }, skin); </script> <div class="clear"></div> <span class="widget-item-control"> <span class="item-control blog-admin"> <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&widgetType=Gadget&widgetId=Gadget2&action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('Gadget2'));" target="configGadget2" title="Edit"> <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/> </a> </span> </span> <div class="clear"></div> </div><div class="widget Stats" id="Stats1"> <h2>Total Pageviews</h2> <div class="widget-content"> <div id="Stats1_content" style="display: none;"> <img alt="Sparkline" height="30" id="Stats1_sparkline" src="/web/20101229083934im_/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html" 
width="75"/> <span class="counter-wrapper text-counter-wrapper" id="Stats1_totalCount"></span> <div class="clear"></div> <span class="widget-item-control"> <span class="item-control blog-admin"> <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&widgetType=Stats&widgetId=Stats1&action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('Stats1'));" target="configStats1" title="Edit"> <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/> </a> </span> </span> <div class="clear"></div> </div> </div> </div><div class="widget PopularPosts" id="PopularPosts1"> <h2>Popular Posts</h2> <div class="widget-content popular-posts"> <ul> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html">Mechanical Turk: Now with 40.92% spam.</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/plea-to-amazon-fix-mechanical-turk.html">A Plea to Amazon: Fix Mechanical Turk!</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/cease-and-desist.html">Cease and desist...</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/explosion-of-micro-crowdsourcing.html">The Explosion of Micro-Crowdsourcing Services</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/sharing-code-apis-and-readability-api.html">Sharing code, API's, and a Readability API</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/11/wisdom-of-crowds-when-do-we-need.html">Wisdom of the Crowds: When do we need Independence?</a> 
</li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/excerpts-from-communist-manifesto.html">Excerpts from "The Communist Manifesto"</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/amazon-reacts-spammers-kicked-out-of.html">Amazon Reacts: Spammers Kicked Out of MTurk!</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/07/mechanical-turk-low-wages-and-market.html">Mechanical Turk, Low Wages, and the Market for Lemons</a> </li> <li> <a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/03/new-demographics-of-mechanical-turk.html">The New Demographics of Mechanical Turk</a> </li> </ul> <div class="clear"></div> <span class="widget-item-control"> <span class="item-control blog-admin"> <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&widgetType=PopularPosts&widgetId=PopularPosts1&action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('PopularPosts1'));" target="configPopularPosts1" title="Edit"> <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/> </a> </span> </span> <div class="clear"></div> </div> </div><div class="widget BlogArchive" id="BlogArchive2"> <h2>Blog Archive</h2> <div class="widget-content"> <div id="ArchiveList"> <div id="BlogArchive2_ArchiveList"> <ul class="hierarchy"> <li class="archivedate expanded"> <a class="toggle" href="javascript:void(0)"> <span class="zippy toggle-open">▼ </span> </a> <a class="post-count-link" 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/search?updated-min=2010-01-01T00%3A00%3A00-05%3A00&updated-max=2011-01-01T00%3A00%3A00-05%3A00&max-results=40">2010</a> <span class="post-count" dir="ltr">(40)</span> <ul class="hierarchy"> <li class="archivedate expanded"> <a class="toggle" href="javascript:void(0)"> <span class="zippy toggle-open">▼ </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_12_01_archive.html">December</a> <span class="post-count" dir="ltr">(4)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/amazon-reacts-spammers-kicked-out-of.html">Amazon Reacts: Spammers Kicked Out of MTurk!</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html">Mechanical Turk: Now with 40.92% spam.</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/sharing-code-apis-and-readability-api.html">Sharing code, API's, and a Readability API</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/excerpts-from-communist-manifesto.html">Excerpts from "The Communist Manifesto"</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_11_01_archive.html">November</a> <span class="post-count" dir="ltr">(4)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/11/wisdom-of-crowds-when-do-we-need.html">Wisdom of the Crowds: When do we need 
Independence...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/11/mechanical-turk-interesting-tasks-and.html">Mechanical Turk, "Interesting Tasks," and Cognitiv...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/11/nyc-i-love-your-data.html">NYC, I Love You(r Data)</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/11/introductory-research-course-replicate.html">Introductory Research Course: Replicate a Paper</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_10_01_archive.html">October</a> <span class="post-count" dir="ltr">(10)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/cease-and-desist.html">Cease and desist...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/student-websites.html">Student websites</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/can-crowdsourcing-scale-role-of-active.html">Can Crowdsourcing Scale? 
The Role of Active Learni...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/plea-to-amazon-fix-mechanical-turk.html">A Plea to Amazon: Fix Mechanical Turk!</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/mechanical-turk-and-data-driven.html">Mechanical Turk and Data Driven Journalism: The Ca...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/be-top-mechanical-turk-worker-you-need.html">Be a Top Mechanical Turk Worker: You Need $5 and 5...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/explosion-of-micro-crowdsourcing.html">The Explosion of Micro-Crowdsourcing Services</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/explosion-of-crowdsourcing-workshops.html">The Explosion of Crowdsourcing Workshops</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/mechanical-turk-requester-activity.html">Mechanical Turk Requester Activity: The Insignific...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/10/what-tasks-are-posted-on-mechanical.html">What Tasks Are Posted on Mechanical Turk?</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_09_01_archive.html">September</a> <span class="post-count" dir="ltr">(2)</span> <ul class="posts"> <li><a 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/09/worker-evaluation-in-crowdsourcing-gold.html">Worker Evaluation in Crowdsourcing: Gold Data or M...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/09/analytics-for-class-lectures.html">Analytics for Class Lectures</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_08_01_archive.html">August</a> <span class="post-count" dir="ltr">(1)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/08/reputation-integration-and-future-of.html">Reputation Integration and the Future of Reviews</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_07_01_archive.html">July</a> <span class="post-count" dir="ltr">(4)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/07/mechanical-turk-low-wages-and-market.html">Mechanical Turk, Low Wages, and the Market for Lem...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/07/peer-reviewing-for-oral-presentations.html">Peer Reviewing for Oral Presentations?</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/07/liveblogging-from-hcomp-2010.html">Liveblogging from HCOMP 2010</a></li> <li><a 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/07/detecting-spammers-on-mechanical-turk.html">Detecting Spammers on Mechanical Turk, Part II</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_06_01_archive.html">June</a> <span class="post-count" dir="ltr">(1)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/06/detecting-spammers-on-mechanical-turk.html">Detecting Spammers on Mechanical Turk, Part I</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_05_01_archive.html">May</a> <span class="post-count" dir="ltr">(6)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/05/accepted-papers-for-hcomp-2010.html">Accepted Papers for HCOMP 2010</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/05/prediction-optimizers.html">Prediction Optimizers</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/05/google-prediction-api-commoditization.html">Google Prediction API: Commoditization of Large-Sc...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/05/google-scholar-now-supports-email.html">Google Scholar now Supports Email Alerts</a></li> <li><a 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/05/crowdsourcing-not-just-cost-saver.html">Crowdsourcing: Not just a cost saver</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/05/kdd-accepted-paper-hcomp-and-sna.html">KDD Accepted Papers, Deadlines for HCOMP 2010 and ...</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_04_01_archive.html">April</a> <span class="post-count" dir="ltr">(2)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/04/yahoos-key-scientific-challenges-your.html">Yahoo!'s Key Scientific Challenges: Your student i...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/04/stop-publishing.html">Stop Publishing!</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_03_01_archive.html">March</a> <span class="post-count" dir="ltr">(3)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/03/getting-high-quality-results-on-mturk.html">Getting High Quality Results on MTurk</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/03/citation-tracker-now-with-api.html">Citation Tracker: Now with an API</a></li> <li><a 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/03/new-demographics-of-mechanical-turk.html">The New Demographics of Mechanical Turk</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_02_01_archive.html">February</a> <span class="post-count" dir="ltr">(1)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/02/why-mechanical-turk-allows-only-us.html">Why Mechanical Turk Allows Only US-based Requester...</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010_01_01_archive.html">January</a> <span class="post-count" dir="ltr">(2)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/01/universities-and-intellectual-property.html">Universities and Intellectual Property: A Minefiel...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/01/did-you-find-this-helpful.html">Did you find this helpful?</a></li> </ul> </li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/search?updated-min=2009-01-01T00%3A00%3A00-05%3A00&updated-max=2010-01-01T00%3A00%3A00-05%3A00&max-results=41">2009</a> <span class="post-count" 
dir="ltr">(41)</span> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_12_01_archive.html">December</a> <span class="post-count" dir="ltr">(1)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/12/prisoners-dilemma-and-mechanical-turk.html">Prisoner's Dilemma and Mechanical Turk</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_11_01_archive.html">November</a> <span class="post-count" dir="ltr">(4)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/11/anchoring-and-mechanical-turk.html">Anchoring and Mechanical Turk</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/11/ignore-test.html">Ignore.. (Test)</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/11/using-nyc-data-mine-for-intro-database.html">Using the NYC Data Mine for an Intro Database Assi...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/11/utility-of-money-and-st-petersburg.html">Utility of Money and the St. 
Petersburg Paradox</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_10_01_archive.html">October</a> <span class="post-count" dir="ltr">(2)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/10/what-is-real-cost-of-open-access.html">What is the (Real) Cost of Open Access?</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/10/when-noise-is-your-friend-smoothed.html">When Noise is Your Friend: Smoothed Analysis</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_09_01_archive.html">September</a> <span class="post-count" dir="ltr">(3)</span> <ul class="posts"> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/09/rationality-pnp-prediction-markets-and.html">Rationality, P=NP, Prediction Markets, and a Parad...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/09/citation-tracker-monitoring-citations.html">Citation Tracker: Monitoring Citations to your Pub...</a></li> <li><a href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009/09/different-attitudes-of-computer.html">The different attitudes of computer scientists and...</a></li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a 
class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_08_01_archive.html">August</a> <span class="post-count" dir="ltr">(4)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_07_01_archive.html">July</a> <span class="post-count" dir="ltr">(4)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_06_01_archive.html">June</a> <span class="post-count" dir="ltr">(3)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_05_01_archive.html">May</a> <span class="post-count" dir="ltr">(2)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_04_01_archive.html">April</a> <span class="post-count" dir="ltr">(2)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_03_01_archive.html">March</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> <ul class="hierarchy"> <li 
class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_02_01_archive.html">February</a> <span class="post-count" dir="ltr">(6)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2009_01_01_archive.html">January</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/search?updated-min=2008-01-01T00%3A00%3A00-05%3A00&updated-max=2009-01-01T00%3A00%3A00-05%3A00&max-results=47">2008</a> <span class="post-count" dir="ltr">(47)</span> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_11_01_archive.html">November</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_10_01_archive.html">October</a> <span class="post-count" dir="ltr">(6)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_09_01_archive.html">September</a> <span class="post-count" dir="ltr">(4)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_08_01_archive.html">August</a> <span class="post-count" dir="ltr">(1)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_07_01_archive.html">July</a> <span class="post-count" dir="ltr">(4)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_06_01_archive.html">June</a> <span class="post-count" dir="ltr">(2)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_05_01_archive.html">May</a> <span class="post-count" dir="ltr">(3)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_04_01_archive.html">April</a> <span class="post-count" dir="ltr">(3)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate 
collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_03_01_archive.html">March</a> <span class="post-count" dir="ltr">(8)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_02_01_archive.html">February</a> <span class="post-count" dir="ltr">(6)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2008_01_01_archive.html">January</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/search?updated-min=2007-01-01T00%3A00%3A00-05%3A00&updated-max=2008-01-01T00%3A00%3A00-05%3A00&max-results=32">2007</a> <span class="post-count" dir="ltr">(32)</span> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_12_01_archive.html">December</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" 
href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_11_01_archive.html">November</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_10_01_archive.html">October</a> <span class="post-count" dir="ltr">(4)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_09_01_archive.html">September</a> <span class="post-count" dir="ltr">(3)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_08_01_archive.html">August</a> <span class="post-count" dir="ltr">(2)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_07_01_archive.html">July</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate collapsed"> <a class="toggle" href="javascript:void(0)"> <span class="zippy"> ►  </span> </a> <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_06_01_archive.html">June</a> <span class="post-count" dir="ltr">(5)</span> </li> </ul> <ul class="hierarchy"> <li class="archivedate 
collapsed">
                <a class="toggle" href="javascript:void(0)">
                  <span class="zippy"> ►&#160; </span>
                </a>
                <a class="post-count-link" href="https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2007_05_01_archive.html">May</a>
                <span class="post-count" dir="ltr">(3)</span>
              </li>
            </ul>
          </li>
        </ul>
        <!-- The two closing tags below end containers that were opened earlier in the file, before the archive list. -->
      </div>
    </div>
    <div class="clear"></div>
    <!--
      "Edit" wrench link for the BlogArchive2 widget. The onclick handler passes the widget element to
      _WidgetManager._PopupConfig. Inner string quotes are single quotes so they do not terminate the
      double-quoted attribute, and query-string ampersands are written as &amp; as XHTML requires.
    -->
    <span class="widget-item-control">
      <span class="item-control blog-admin">
        <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&amp;widgetType=BlogArchive&amp;widgetId=BlogArchive2&amp;action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('BlogArchive2'));" target="configBlogArchive2" title="Edit">
          <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/>
        </a>
      </span>
    </span>
    <div class="clear"></div>
  </div>
</div>

<!-- HTML4 widget: a single PostRank "blog claim" image. It carries no visible information, so it gets an empty alt. -->
<div class="widget HTML" id="HTML4">
  <div class="widget-content">
    <img alt="" src="https://web.archive.org/web/20101229083934im_/http://postrank.com/graphics/blog_claim.png?s=cp3lj7k"/>
  </div>
  <div class="clear"></div>
  <!-- "Edit" wrench link for the HTML4 widget (same quoting and &amp; rules as the other quickedit links). -->
  <span class="widget-item-control">
    <span class="item-control blog-admin">
      <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&amp;widgetType=HTML&amp;widgetId=HTML4&amp;action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('HTML4'));" target="configHTML4" title="Edit">
        <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/>
      </a>
    </span>
  </span>
  <div class="clear"></div>
</div>

<!-- HTML1 widget: loads mathtex3.js and then calls replaceMath on the whole document body. -->
<div class="widget HTML" id="HTML1">
  <div class="widget-content">
    <script src="https://web.archive.org/web/20101229083934js_/http://www.watchmath.com/cgi-bin/mathtex3.js" type="text/javascript"></script>
    <script type="text/javascript">
      /* replaceMath is not defined in this file; presumably it comes from mathtex3.js loaded just above. */
      replaceMath( document.body );
    </script>
  </div>
  <div class="clear"></div>
  <!-- "Edit" wrench link for the HTML1 widget (same quoting and &amp; rules as the other quickedit links). -->
  <span class="widget-item-control">
    <span class="item-control blog-admin">
      <a class="quickedit" href="https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631&amp;widgetType=HTML&amp;widgetId=HTML1&amp;action=editWidget" onclick="return _WidgetManager._PopupConfig(document.getElementById('HTML1'));" target="configHTML1" title="Edit">
        <img alt="" height="18" src="https://web.archive.org/web/20101229083934im_/http://img1.blogblog.com/img/icon18_wrench_allbkg.png" width="18"/>
      </a>
    </span>
  </span>
  <div class="clear"></div>
</div>

<!-- HTML3 widget: Disqus integration. Hides the native comment block and comment links, then injects two Disqus scripts. -->
<div class="widget HTML" id="HTML3">
  <script type="text/javascript">
    /* Globals read by the two loader snippets below (disqus_shortname builds the script host name). */
    var disqus_shortname = 'behind-the-enemy-lines';
    var disqus_blogger_current_url = 'https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html';
  </script>
  <style type="text/css">
    /* Hide the element with id "comments". */
    #comments {display:none;}
  </style>
  <script type="text/javascript">
    /* Asynchronously append blogger_item.js to head, falling back to body when there is no head element. */
    /* NOTE(review): the script URL is plain http while this page is served over https; confirm it still loads. */
    (function() {
      var bloggerjs = document.createElement('script');
      bloggerjs.type = 'text/javascript';
      bloggerjs.async = true;
      bloggerjs.src = 'http://'+disqus_shortname+'.disqus.com/blogger_item.js';
      (document.getElementsByTagName('head')[0] || document.getElementsByTagName('body')[0]).appendChild(bloggerjs);
    })();
  </script>
  <style type="text/css">
    /* Keep the layout space of comment links but make them invisible. */
    .post-comment-link { visibility: hidden; }
  </style>
  <script type="text/javascript">
    /* Same loader pattern as above, for blogger_index.js. */
    (function() {
      var bloggerjs = document.createElement('script');
      bloggerjs.type = 'text/javascript';
      bloggerjs.async = true;
      bloggerjs.src = 'http://'+disqus_shortname+'.disqus.com/blogger_index.js';
      (document.getElementsByTagName('head')[0] || document.getElementsByTagName('body')[0]).appendChild(bloggerjs);
    })();
  </script>
</div></div>
</div>
<!-- spacer for skins that want sidebar and main to be the same height-->
<div class="clear">&#160;</div>
</div> <!-- end content-wrapper -->
<div id="footer-wrapper">
  <div class="footer section" id="footer"></div>
</div>
</div></div> <!-- end outer-wrapper -->

<!-- Records a 'widgetJsBefore' timing tick (only when window.jstiming exists), then loads the Blogger widgets script. -->
<script type="text/javascript"> if (window.jstiming) window.jstiming.load.tick('widgetJsBefore'); </script>
<script type="text/javascript" src="https://web.archive.org/web/20101229083934js_/http://www.blogger.com/static/v1/widgets/512629240-widgets.js"></script>

<!-- Page bootstrap: initialises _WidgetManager, hands it the page data context, and registers every widget on the page. -->
<script type="text/javascript">
// IMPORTANT: keep every string literal in this script on ONE physical line.
// A quoted JavaScript string may not contain a raw line break; wrapping inside
// 'feedLinks' or 'latencyHeadScript' makes the whole script a syntax error, so
// none of the calls below would run.
//
// The long strings use octal escapes in place of markup characters:
// \74 is the less-than sign, \76 the greater-than sign, \42 a double quote,
// \75 (or \075) an equals sign and \46 an ampersand.

// Runs only when BLOG_attachCsiOnload is defined and non-null.
// NOTE(review): presumably provided by the widgets script loaded above; confirm.
if (typeof(BLOG_attachCsiOnload) != 'undefined' && BLOG_attachCsiOnload != null) {
  window['blogger_templates_experiment_id'] = "templatesV1";
  window['blogger_blog_id'] = '7118563403027467631';
  BLOG_attachCsiOnload('item_');
}

// _WidgetManager is not defined in this file; it is assumed to come from the widgets script.
_WidgetManager._Init('https://web.archive.org/web/20101229083934/http://www.blogger.com/rearrange?blogID=7118563403027467631','https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html','7118563403027467631');
_WidgetManager._SetPageActionUrl('https://web.archive.org/web/20101229083934/http://www.blogger.com/display?blogID=7118563403027467631','H2XI9R7CMMFsbTJ6TmyPuKunJn4:1293611405037','AOuZoY5YWYEHoQ0w1lqHldfPj8v9d5XGRg:1293611405037');

// Blog-level metadata for this item page (title, URLs, locale, and pre-rendered head markup as escaped strings).
_WidgetManager._SetDataContext([{
  'name': 'blog',
  'data': {
    'title': 'A Computer Scientist in a Business School',
    'pageType': 'item',
    'url': 'https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html',
    'canonicalUrl': 'https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html',
    'homepageUrl': 'https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/',
    'enabledCommentProfileImages': true,
    'searchLabel': '',
    'searchQuery': '',
    'pageName': 'Mechanical Turk: Now with 40.92% spam.',
    'pageTitle': 'A Computer Scientist in a Business School: Mechanical Turk: Now with 40.92% spam.',
    'encoding': 'UTF-8',
    'locale': 'en-US',
    'isPrivate': false,
    'isMobile': false,
    'mobileClass': '',
    'languageDirection': 'ltr',
    'feedLinks': '\74link rel\75\42alternate\42 type\75\42application/atom+xml\42 title\75\42A Computer Scientist in a Business School - Atom\42 href\75\42http://behind-the-enemy-lines.blogspot.com/feeds/posts/default\42 /\76\n\74link rel\75\42alternate\42 type\75\42application/rss+xml\42 title\75\42A Computer Scientist in a Business School - RSS\42 href\75\42http://behind-the-enemy-lines.blogspot.com/feeds/posts/default?alt\75rss\42 /\76\n\74link rel\75\42service.post\42 type\75\42application/atom+xml\42 title\75\42A Computer Scientist in a Business School - Atom\42 href\75\42http://www.blogger.com/feeds/7118563403027467631/posts/default\42 /\76\n\74link rel\75\42EditURI\42 type\75\42application/rsd+xml\42 title\75\42RSD\42 href\75\42http://www.blogger.com/rsd.g?blogID\0757118563403027467631\42 /\76\n\74link rel\75\42alternate\42 type\75\42application/atom+xml\42 title\75\42A Computer Scientist in a Business School - Atom\42 href\75\42http://behind-the-enemy-lines.blogspot.com/feeds/2428602678035046823/comments/default\42 /\76\n',
    'meTag': '',
    'openIdOpTag': '',
    'imageSrcTag': '\74link rel\75\42image_src\42 href\75\42http://2.bp.blogspot.com/_skxW9kDLt_c/TQpWpze7-VI/AAAAAAAAfn0/02yFP0s79eQ/s72-c/spam-vs-notspam.PNG\42 /\76\n',
    'latencyHeadScript': '\74script type\75\42text/javascript\42\76(function() { var a\75window;function c(b){this.t\75{};this.tick\75function(d,i,e){e\75e?e:(new Date).getTime();this.t[d]\75[e,i]};this.tick(\42start\42,null,b)}var f\75new c;a.jstiming\75{Timer:c,load:f};try{var g\75null;if(a.chrome\46\46a.chrome.csi)g\75Math.floor(a.chrome.csi().pageT);if(g\75\75null)if(a.gtbExternal)g\75a.gtbExternal.pageT();if(g\75\75null)if(a.external)g\75a.external.pageT;if(g)a.jstiming.pt\75g}catch(h){};a.tickAboveFold\75function(b){b\75b;var d\0750;if(b.offsetParent){do d+\75b.offsetTop;while(b\75b.offsetParent)}b\75d;b\74\075750\46\46a.jstiming.load.tick(\42aft\42)};var j\75false;function k(){if(!j){j\75true;a.jstiming.load.tick(\42firstScrollTime\42)}}a.addEventListener?a.addEventListener(\42scroll\42,k,false):a.attachEvent(\42onscroll\42,k);\n })();\74/script\076',
    'mobileHeadScript': ''
  }
}]);

// Sidebar widgets, registered in the original order. Each one is bound to its DOM element by id.
_WidgetManager._RegisterWidget('_ProfileView', new _WidgetInfo('Profile2', 'sidebar', null, document.getElementById('Profile2'), {}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_HTMLView', new _WidgetInfo('HTML2', 'sidebar', null, document.getElementById('HTML2'), {}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_GadgetView', new _WidgetInfo('Gadget2', 'sidebar', null, document.getElementById('Gadget2'), {}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_StatsView', new _WidgetInfo('Stats1', 'sidebar', null, document.getElementById('Stats1'), {'title': 'Total Pageviews', 'showGraphicalCounter': false, 'showAnimatedCounter': false, 'showSparkline': true, 'statsUrl': 'https://web.archive.org/web/20101229083934/http://behind-the-enemy-lines.blogspot.com/b/stats?style\75BLACK_TRANSPARENT\46timeRange\75ALL_TIME\46token\0757gL3Mi0BAAA.7K_f2mQ2ZOaJpDqWR6SeqtDcwgH99T59GpsEbXbMFXk.dAPzUvLQVK0VEZ0pYdbdvw'}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_PopularPostsView', new _WidgetInfo('PopularPosts1', 'sidebar', null, document.getElementById('PopularPosts1'), {}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_BlogArchiveView', new _WidgetInfo('BlogArchive2', 'sidebar', null, document.getElementById('BlogArchive2'), {'languageDirection': 'ltr'}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_HTMLView', new _WidgetInfo('HTML4', 'sidebar', null, document.getElementById('HTML4'), {}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_HTMLView', new _WidgetInfo('HTML1', 'sidebar', null, document.getElementById('HTML1'), {}, 'displayModeFull'));
_WidgetManager._RegisterWidget('_HTMLView', new _WidgetInfo('HTML3', 'sidebar', null, document.getElementById('HTML3'), {}, 'displayModeFull'));

// Header, navbar and main blog widgets. The first two are registered without a DOM element or options.
_WidgetManager._RegisterWidget('_HeaderView', new _WidgetInfo('Header1', 'header'));
_WidgetManager._RegisterWidget('_NavbarView', new _WidgetInfo('Navbar1', 'navbar'));
_WidgetManager._RegisterWidget('_BlogView', new _WidgetInfo('Blog2', 'main', null, document.getElementById('Blog2'), {'cmtInteractionsEnabled': false, 'commentInteractionIframeUrl': 'https://web.archive.org/web/20101229083934/http://www.blogger.com/comment-interaction-iframe.g?blogId\0757118563403027467631', 'showBacklinks': true, 'postId': '2428602678035046823', 'mobile': false}, 'displayModeFull'));
</script>
</body>
</html><!-- FILE ARCHIVED ON 08:39:34 Dec 29, 2010 AND RETRIEVED FROM THE INTERNET ARCHIVE ON 17:41:42 Feb 21, 2025. JAVASCRIPT APPENDED BY WAYBACK MACHINE, COPYRIGHT INTERNET ARCHIVE. ALL OTHER CONTENT MAY ALSO BE PROTECTED BY COPYRIGHT (17 U.S.C. SECTION 108(a)(3)). --> <!-- playback timings (ms): captures_list: 0.833 exclusion.robots: 0.035 exclusion.robots.policy: 0.021 esindex: 0.018 cdx.remote: 7.17 LoadShardBlock: 1638.635 (3) PetaboxLoader3.datanode: 1100.79 (4) PetaboxLoader3.resolve: 1984.193 (2) load_resource: 1840.01 -->