// ==UserScript== // @name HIT Scraper WITH EXPORT // @author Kerek and TJ // @description Snag HITs. // Based in part on code from mmmturkeybacon Export Mturk History and mmmturkeybacon Color Coded Search with Checkpoints // @namespace http://userscripts.org/users/536998 // @match https://www.mturk.com/mturk/findhits?match=true#hit_scraper* // @match https://www.mturk.com/mturk/findhits?match=true?hit_scraper* // @version 1.5.4 // @grant GM_xmlhttpRequest // @require http://code.jquery.com/jquery-latest.min.js // @downloadURL none // ==/UserScript== //Fixes it soas not to rely on GM's storage schemes if (!this.GM_getValue || (this.GM_getValue.toString && this.GM_getValue.toString().indexOf("not supported")>-1)) { this.GM_getValue=function (key,def) { return localStorage[key] || def; }; this.GM_setValue=function (key,value) { return localStorage[key]=value; }; this.GM_deleteValue=function (key) { return localStorage.removeItem(key); }; } //alter the requester ignore last as you desire, case insensitive var default_list = ["oscar smith", "Diamond Tip Research LLC", "jonathon weber", "jerry torres", "Crowdsource", "we-pay-you-fast", "turk experiment", "jon brelig"]; var ignore_list = default_list; if (GM_getValue("scraper_ignore_list")) ignore_list = GM_getValue("scraper_ignore_list").split('^'); else GM_setValue("scraper_ignore_list", default_list.join('^')); var include_list = []; if (GM_getValue("scraper_include_list")) include_list = GM_getValue("scraper_include_list").split('^'); //This is to update the hit export symbol var symbol = "☭"; //this searches extra pages if you skip too much, helps fill out results if you hit a chunk of ignored HITs. Change to true for this behavior. var correct_for_skips = true; //weight the four TO ratings for the coloring. Default has pay twice as important as fairness and nothing for communication and fast. var COMM_WEIGHT = 0; var PAY_WEIGHT = 10; var FAIR_WEIGHT = 5; var FAST_WEIGHT = 0; //Used for themeing, change the colors to change how scraper looks var GREEN = '#66CC66'; // > 4 var LIGHTGREEN = '#ADFF2F'; // > 3 GREEN YELLOW var YELLOW = '#FFD700'; //Not used var ORANGE = '#FF9900'; // > 2 var RED = '#FF3030'; // <= 2 var BLUE = '#C0D9D9'; // no TO var GREY = 'lightGrey'; //TO down var BROWN = '#94704D'; //Font color var DARKGREY = '#9F9F9F'; //No HITDB, "Not Qualified" column var BACKGROUND_COLOR = "rgb(19, 19, 19)"; //Background of page //display your hitdb records if applicable var check_hitDB = true; //default text size var default_text_size=11; //set to "true" to override checkbox setting and ding on new hits var newHitDing = false; //DO NOT EDIT ANYTHING BELOW THIS LINE UNLESS YOU KNOW WHAT YOU ARE DOING! var status_text = "None"; var shouldDing = false; var audio = document.createElement('audio'); document.body.appendChild(audio); audio.src = 'data:audio/ogg;base64,T2dnUwACAAAAAAAAAAB8mpoRAAAAAFLKt9gBHgF2b3JiaXMAAAAAARErAAAAAAAAkGUAAAAAAACZAU9nZ1MAAAAAAAAAAAAAfJqaEQEAAACHYsq6Cy3///////////+1A3ZvcmJpcx0AAABYaXBoLk9yZyBsaWJWb3JiaXMgSSAyMDA1MDMwNAAAAAABBXZvcmJpcxJCQ1YBAAABAAxSFCElGVNKYwiVUlIpBR1jUFtHHWPUOUYhZBBTiEkZpXtPKpVYSsgRUlgpRR1TTFNJlVKWKUUdYxRTSCFT1jFloXMUS4ZJCSVsTa50FkvomWOWMUYdY85aSp1j1jFFHWNSUkmhcxg6ZiVkFDpGxehifDA6laJCKL7H3lLpLYWKW4q91xpT6y2EGEtpwQhhc+211dxKasUYY4wxxsXiUyiC0JBVAAABAABABAFCQ1YBAAoAAMJQDEVRgNCQVQBABgCAABRFcRTHcRxHkiTLAkJDVgEAQAAAAgAAKI7hKJIjSZJkWZZlWZameZaouaov+64u667t6roOhIasBADIAAAYhiGH3knMkFOQSSYpVcw5CKH1DjnlFGTSUsaYYoxRzpBTDDEFMYbQKYUQ1E45pQwiCENInWTOIEs96OBi5zgQGrIiAIgCAACMQYwhxpBzDEoGIXKOScggRM45KZ2UTEoorbSWSQktldYi55yUTkompbQWUsuklNZCKwUAAAQ4AAAEWAiFhqwIAKIAABCDkFJIKcSUYk4xh5RSjinHkFLMOcWYcowx6CBUzDHIHIRIKcUYc0455iBkDCrmHIQMMgEAAAEOAAABFkKhISsCgDgBAIMkaZqlaaJoaZooeqaoqqIoqqrleabpmaaqeqKpqqaquq6pqq5seZ5peqaoqp4pqqqpqq5rqqrriqpqy6ar2rbpqrbsyrJuu7Ks256qyrapurJuqq5tu7Js664s27rkearqmabreqbpuqrr2rLqurLtmabriqor26bryrLryratyrKua6bpuqKr2q6purLtyq5tu7Ks+6br6rbqyrquyrLu27au+7KtC7vourauyq6uq7Ks67It67Zs20LJ81TVM03X9UzTdVXXtW3VdW1bM03XNV1XlkXVdWXVlXVddWVb90zTdU1XlWXTVWVZlWXddmVXl0XXtW1Vln1ddWVfl23d92VZ133TdXVblWXbV2VZ92Vd94VZt33dU1VbN11X103X1X1b131htm3fF11X11XZ1oVVlnXf1n1lmHWdMLqurqu27OuqLOu+ruvGMOu6MKy6bfyurQvDq+vGseu+rty+j2rbvvDqtjG8um4cu7Abv+37xrGpqm2brqvrpivrumzrvm/runGMrqvrqiz7uurKvm/ruvDrvi8Mo+vquirLurDasq/Lui4Mu64bw2rbwu7aunDMsi4Mt+8rx68LQ9W2heHVdaOr28ZvC8PSN3a+AACAAQcAgAATykChISsCgDgBAAYhCBVjECrGIIQQUgohpFQxBiFjDkrGHJQQSkkhlNIqxiBkjknIHJMQSmiplNBKKKWlUEpLoZTWUmotptRaDKG0FEpprZTSWmopttRSbBVjEDLnpGSOSSiltFZKaSlzTErGoKQOQiqlpNJKSa1lzknJoKPSOUippNJSSam1UEproZTWSkqxpdJKba3FGkppLaTSWkmptdRSba21WiPGIGSMQcmck1JKSamU0lrmnJQOOiqZg5JKKamVklKsmJPSQSglg4xKSaW1kkoroZTWSkqxhVJaa63VmFJLNZSSWkmpxVBKa621GlMrNYVQUgultBZKaa21VmtqLbZQQmuhpBZLKjG1FmNtrcUYSmmtpBJbKanFFluNrbVYU0s1lpJibK3V2EotOdZaa0ot1tJSjK21mFtMucVYaw0ltBZKaa2U0lpKrcXWWq2hlNZKKrGVklpsrdXYWow1lNJiKSm1kEpsrbVYW2w1ppZibLHVWFKLMcZYc0u11ZRai621WEsrNcYYa2415VIAAMCAAwBAgAlloNCQlQBAFAAAYAxjjEFoFHLMOSmNUs45JyVzDkIIKWXOQQghpc45CKW01DkHoZSUQikppRRbKCWl1losAACgwAEAIMAGTYnFAQoNWQkARAEAIMYoxRiExiClGIPQGKMUYxAqpRhzDkKlFGPOQcgYc85BKRljzkEnJYQQQimlhBBCKKWUAgAAChwAAAJs0JRYHKDQkBUBQBQAAGAMYgwxhiB0UjopEYRMSielkRJaCylllkqKJcbMWomtxNhICa2F1jJrJcbSYkatxFhiKgAA7MABAOzAQig0ZCUAkAcAQBijFGPOOWcQYsw5CCE0CDHmHIQQKsaccw5CCBVjzjkHIYTOOecghBBC55xzEEIIoYMQQgillNJBCCGEUkrpIIQQQimldBBCCKGUUgoAACpwAAAIsFFkc4KRoEJDVgIAeQAAgDFKOSclpUYpxiCkFFujFGMQUmqtYgxCSq3FWDEGIaXWYuwgpNRajLV2EFJqLcZaQ0qtxVhrziGl1mKsNdfUWoy15tx7ai3GWnPOuQAA3AUHALADG0U2JxgJKjRkJQCQBwBAIKQUY4w5h5RijDHnnENKMcaYc84pxhhzzjnnFGOMOeecc4wx55xzzjnGmHPOOeecc84556CDkDnnnHPQQeicc845CCF0zjnnHIQQCgAAKnAAAAiwUWRzgpGgQkNWAgDhAACAMZRSSimllFJKqKOUUkoppZRSAiGllFJKKaWUUkoppZRSSimllFJKKaWUUkoppZRSSimllFJKKaWUUkoppZRSSimllFJKKaWUUkoppZRSSimllFJKKaWUUkoppZRSSimllFJKKaWUUkoppZRSSimllFJKKaWUUkoppZRSSimVUkoppZRSSimllFJKKaUAIN8KBwD/BxtnWEk6KxwNLjRkJQAQDgAAGMMYhIw5JyWlhjEIpXROSkklNYxBKKVzElJKKYPQWmqlpNJSShmElGILIZWUWgqltFZrKam1lFIoKcUaS0qppdYy5ySkklpLrbaYOQelpNZaaq3FEEJKsbXWUmuxdVJSSa211lptLaSUWmstxtZibCWlllprqcXWWkyptRZbSy3G1mJLrcXYYosxxhoLAOBucACASLBxhpWks8LR4EJDVgIAIQEABDJKOeecgxBCCCFSijHnoIMQQgghREox5pyDEEIIIYSMMecghBBCCKGUkDHmHIQQQgghhFI65yCEUEoJpZRSSucchBBCCKWUUkoJIYQQQiillFJKKSGEEEoppZRSSiklhBBCKKWUUkoppYQQQiillFJKKaWUEEIopZRSSimllBJCCKGUUkoppZRSQgillFJKKaWUUkooIYRSSimllFJKCSWUUkoppZRSSikhlFJKKaWUUkoppQAAgAMHAIAAI+gko8oibDThwgMQAAAAAgACTACBAYKCUQgChBEIAAAAAAAIAPgAAEgKgIiIaOYMDhASFBYYGhweICIkAAAAAAAAAAAAAAAABE9nZ1MABAgkAAAAAAAAfJqaEQIAAAB89IOyJjhEQUNNRE5TRENHS0xTRllHSEpISUdORk1GSEdISUNHP0ZHS1IhquPYHv5OAgC/7wFATp2pUBdXuyHsT4XRISOWEsj9QgEA7CC99FBIaDsrM+hbibFaAl81wg+vGnum4/p5roRKJAAAQFGOdsUy794bb3kbX50b8wL0NECgHlr67FRjAIAlBqKQyl55KU64p02UMHrBl0yZbWiGBSJYvJwiAaLj+vfck0gAnrsDAJV8Gl9y2ovHlFW+iSn7ZmRlQAb9lx4A4hz/EEPP9W5bRn5ldI8wU4fR+xS3ZLKtvYvVL687nuL6t9yTeAC+RwCEqOwlsbp1/8nH92xUT3KcsFhk7T4kAADwbXSbV8XCH6fYyccR20ceVzbp65K8wTKt7i29DHrNRpbg+llWQiUAAABh8SfmNYz1zNJvVm/6ZulEwE4BZEcYiZ+X5QQAsDib+e7cFjM7i9MfI304kTbyzFlUlxMZW92vpQmnJf6GaI40HUgUhuDlGH4SiwBwPQCEotz12nIjLju/n4bWM2RrhQP26bAAAEJxvd5Y66S0Bk6b+hozw2kzVccJx/ajEnnIWdBXbMON0UJ+YC/LJwGAawygypSJUV3enfpuR4a1NshSpqhl1t95c7XpMobYmrGOdWy9kMLS280QcKu7WxbJ2uukrVrMMMQ2V6o4GbYBVyi1zt6mTwOW4r0O3hJoAMA1A1AVxeA82nYulS/PeZS76iiXQcld82TW68AVRVaGbYu3pYy2dCtv2WPZTW4aze95YsP2ht8H9ob2sHdj2aP5xvzGMvrcPuw3DJbg+pl7SwAA4JoQAKEoRmuTA1datn0ll4M+RDIgwepTegCAqZXJwi4+D9CbO9co4qTOEo4nJQk1ilBItSPefZhsCFADluD6mXtLQDYAeKoOQCiygt5MbOFxku9OoakVCRshIH7t0QMAsAvYnyc9wcaLOrepVBelSJ5YqXw57wGbOJf0QmBIAZbf+pi9JQgIAHxPBiAUZSwOroLZG1W7/N3+lCr8SBC1+1oAAKDoRWT56b6YcafEq0xsUDbM+7p712GNyfWWOMh+MX2y9t4Ajt/60d4SAAAwYQCEVXkuoAma6qXER1ZLu2GlDQLBvwcdACAPR5Sb2vYgzJ8uxdxSE127cNRnPpdsJZ4NMndjTdbblB/nE1PKjWcAjt8RjScBgH4SQJUpY3MiJTGRJmXGjImpRAjBZs1sNmtM5P86m3EcU5cSkC9b8eY3Pp96HVJjwP4rz19qS8yY4sW8W9OlKl2BeJw8EZbioceTAMBzBqAqyl4y2V0me0/D3qUeI3cIURT5Wytli7flLsdxKBaV7aIcRMOhcDROe6VmZlx8Wvfo9JnMW+Xfqsv0ynjdVK/MzFQbMjPVmTkrit5ivp0EAHbCAAjFHZ+WVE/2qWubq96d1HGjRkCYMmYAQLOZZYEblKknCTLC3Fla72pISpk4z9x1sjuZrttub1LUJ7vpBIreXQKXAFwDg6IcCzOmDu0NiSNTR+7tTyQSiRBGE4e+2JLycuv6ere1P1Pl8/Y/biuttqVa0RuwLXKPW2JbWh8qGysH3pXVYRofzOW4oS9KVk6oeZa7BHcclt8xp28J0ABA1QAIRZnKdDQLZzv2vZR6R7SDCNLiDPu/JgCA2ddgPznKws0y9ko0o/FZp5UKN2aTLwFhOkzbGk7Ev69tHACS3/oxe0tAAgCf9wAIRVawTrOhvznPSHXcBU3RRqYNQTr+bQUAgMqdkd316ov0ymXJ8FLa1f8b79fj3R4By8t8Dk5FPP5LnAiS3/rwviUAAHBNCICw+Ht66212jr0bz0zNqNLUqFY1A9xMaQEANp/b9ba5yPZORo4ec5Hx/Coj7MILu6hGm9Hp5ijH2FmPQjZqAZLferjfEhAAwFYdgFCUiWYwt9TVuWGVr8cm59axURwJOqv0AMAj50k+vICuG/fuoNnVN2t7+a9VtsYCea7kqrItmTnEQa79GYrfenjfEhANAJ4RAKEouzmardahkP4tso7fBsViChGWqgUAYKA7f720O5LqX9FXzSku1sC3tVHxq++uVfaXuowa3NJx6Ks0egOG3iWGneQAsBMEIBT/zXRNrr38c9rdz2qpCpgB6gqDNADApWZZSvcm7VyTo1yW3Vs1q8xMmgEBWwoze23kQBDMDRPt7i4hC5LfIY+nDgDk5ACwwnowLLvft7ekXds5nezEig0nclrDi8Or66XICZaq4ime564bwYdBWO8dvmfNrsCSW5AeWe1ifN2R9nS21RC4NME1A4rh4lzfEiQAQE8QgFCUaTOXH1J3pjkwKlntkpRBWCvsIb8OAKANWER83tlHOBVJaZ2NJWXKSqhgA34zuOPehVVh/B3ICQOO4KK+3xIQAMDnfQBSpxrzCH2U6pHp7WZ6PwyCqAkm+eWrBAA4Kdb8uJEp5f1dXgrhcvR9MoeMyzG0i/uYgHyN0jrNek+GubvriIm6G47hor7fEgAAUCUAobJUrNbG3GOY9blo5oPOduQP0lqkd7UeALwgdweI4PWcyLTRw5Fdntehe/trjP5IJSJznmuLpm7H2AGG4GLMbiUAAPDcAAiLpczJlR2n60F9PErm8YqNiQOyfr9UAQB2KTnX3MdFOTMzJcfCSrwWl1HWIzI7uxB1TsQuEPx9LoN6hgCG4GLMbiVAA4CtGgChVrYNbTwU1eZqiFJ5aigd6zgQrfzXAQCU0XsD+QyRUGiFAr5hrfR2sPZgJsjrhXh7P8+AqkfZQ0B8BoZeVea3BOQCgJ4IQKgsr2dxyXYl7caDKOsvx4ppZRDYXakBABCbnhZ61lw0GWo5b34cYxZ5CVel7QjFunVc7uMuNtizydMTHIZdVecn8QBcJwAylf/guBJzi/V87Sae+JlHxQYbsKPLKgAQAOso9x00mcrgiC+iUmxOnvchtha7pB1piFRd2YyH3IQ9+rS5KA2CYFT+JwEAVQIQimTsNSzPy/J8ZphM3e2dDMHaEES8/lovAQhg5HLoVVKXxj1K71I7cJxAeWFDYcfOIR/LcsdhJeo5fuBRhicBgKcBCJVqdk5erKV2T6fejJ4y5zkhsYgwewHAUnpnobQUEvXMdFbKoF3tzr9dP6htsqXVgL7D6TN0HnVL38UVkQ164xGPtyQhAICtAGC5fMRbGFCeNkvX5h6nXQxEIQBlWQ0AACaNu+sdjcTc3HKvtL7+nrprlFMlxCGXw0Jg6wN+nYqXkwBATwE4A8AfreeeYJ3ee/G0MzGii4iwVtrHNQ0AQBWg7wMR1wL09Ywau3DR1Lr3zU2kmxYEJR0NgtRDdnEio4ZJdl4Vo1sCBAC4TgCBQTY2QLPnmPkpfS846yNWBgKOXd5JSADArF9HjUZd1KCzNse+k3ck7bCGnfr+6eHjs1m4k9cQsPUEHQB+n8LpSXQAjAHkrLI094zNHePypKdf9RIWN0lIy/Bx1JECYkgi481PP5FG1l/fLPa51xrTFkIuUqPIjTxdY0Qh6riz3rXJ/vF0dkSSW9DTqgAAmeJx/scynl627KXON973XgpjzRJ1Hj6/CMlCc+hfQ6eIKQm7nLAMh3X1YorEW8vqOL44wn79D/pIETNBW/AzzX9681U4DJzb4PYDesvZ34xswFUCkGrRAGD1Nx4AeF4pACxWbrDxrjgDwBwF'; audio.setAttribute("id", "ding_noise"); audio.volume = 1; function newHits(dingNoise) { console.log(dingNoise); if (dingNoise || newHitDing) document.getElementById("ding_noise").play(); } //For editing the blocklist var div = document.createElement('div'); var textarea = document.createElement('textarea'); div.style.position = 'fixed'; div.style.width = '500px'; div.style.height = '235px'; div.style.left = '50%'; div.style.right = '50%'; div.style.margin = '-250px 0px 0px -250px'; div.style.top = '300px'; div.style.padding = '5px'; div.style.border = '2px'; div.style.backgroundColor = 'black'; div.style.color = 'white'; div.style.zIndex = '100'; div.setAttribute('id','block_div'); textarea.style.padding = '2px'; textarea.style.width = '500px'; textarea.style.height = '180px'; textarea.title = 'Block list'; textarea.setAttribute('id','block_text'); div.textContent = 'Change the blocklist to be whatever you like, save to save it. Separate requesters with the ^ character. After clicking "Save", you\'ll need to scrape again to apply the changes.'; div.style.fontSize = '12px'; div.appendChild(textarea); var save_button = document.createElement('button'); var cancel_button = document.createElement('button'); save_button.textContent = 'Save'; save_button.setAttribute('id', 'save_blocklist'); save_button.style.height = '18px'; save_button.style.width = '100px'; save_button.style.fontSize = '10px'; save_button.style.paddingLeft = '3px'; save_button.style.paddingRight = '3px'; save_button.style.backgroundColor = 'white'; save_button.style.marginLeft = '5px'; cancel_button.textContent = 'Cancel'; cancel_button.setAttribute('id', 'cancel_blocklist'); cancel_button.style.height = '18px'; cancel_button.style.width = '100px'; cancel_button.style.fontSize = '10px'; cancel_button.style.paddingLeft = '3px'; cancel_button.style.paddingRight = '3px'; cancel_button.style.backgroundColor = 'white'; cancel_button.style.marginLeft = '5px'; div.appendChild(save_button); div.appendChild(cancel_button); $("#block_div").hide(); save_button.addEventListener("click", function() {save_blocklist();}, false); cancel_button.addEventListener("click", function() {$("#block_div").hide();}, false); document.body.insertBefore(div, document.body.firstChild); //For editing the include list var shouldInclude = false; var div2 = document.createElement('div'); var textarea2 = document.createElement('textarea'); div2.style.position = 'fixed'; div2.style.width = '500px'; div2.style.height = '235px'; div2.style.left = '50%'; div2.style.right = '50%'; div2.style.margin = '-250px 0px 0px -250px'; div2.style.top = '300px'; div2.style.padding = '5px'; div2.style.border = '2px'; div2.style.backgroundColor = 'black'; div2.style.color = 'white'; div2.style.zIndex = '100'; div2.setAttribute('id','include_div'); textarea2.style.padding = '2px'; textarea2.style.width = '500px'; textarea2.style.height = '180px'; textarea2.title = 'include list'; textarea2.setAttribute('id','include_text'); div2.textContent = 'Used if you only want to see certain requesters. Separator is ^. Only takes effect if \"Use includelist\" is checked.'; div2.style.fontSize = '12px'; div2.appendChild(textarea2); var save_button2 = document.createElement('button'); var cancel_button2 = document.createElement('button'); save_button2.textContent = 'Save'; save_button2.setAttribute('id', 'save_includelist'); save_button2.style.height = '18px'; save_button2.style.width = '100px'; save_button2.style.fontSize = '10px'; save_button2.style.paddingLeft = '3px'; save_button2.style.paddingRight = '3px'; save_button2.style.backgroundColor = 'white'; save_button2.style.marginLeft = '5px'; cancel_button2.textContent = 'Cancel'; cancel_button2.setAttribute('id', 'cancel_includelist'); cancel_button2.style.height = '18px'; cancel_button2.style.width = '100px'; cancel_button2.style.fontSize = '10px'; cancel_button2.style.paddingLeft = '3px'; cancel_button2.style.paddingRight = '3px'; cancel_button2.style.backgroundColor = 'white'; cancel_button2.style.marginLeft = '5px'; div2.appendChild(save_button2); div2.appendChild(cancel_button2); $("#include_div").hide(); save_button2.addEventListener("click", function() {save_includelist();}, false); cancel_button2.addEventListener("click", function() {$("#include_div").hide();}, false); document.body.insertBefore(div2, document.body.firstChild); function save_blocklist() { console.log("Save"); var textarea = $("#block_text"); var text = textarea.val(); var block_list = text.split("^"); var trimmed_list = []; for (var requester in block_list){ if (block_list[requester].trim().length != 0) trimmed_list.push(block_list[requester].toLowerCase().trim()); } console.log(trimmed_list); GM_setValue("scraper_ignore_list",trimmed_list.join('^')); ignore_list = GM_getValue("scraper_ignore_list").split('^'); console.log("Save complete: "); console.log(ignore_list); $("#block_div").hide(); } function save_includelist() { console.log("Save"); var textarea = $("#include_text"); var text = textarea.val(); var includes = text.split("^"); console.log(includes); var trimmed_list = []; for (var requester in includes){ if (includes[requester].trim().length != 0) trimmed_list.push(includes[requester].toLowerCase().trim()); } GM_setValue("scraper_include_list",trimmed_list.join('^')); include_list = GM_getValue("scraper_include_list").split('^'); console.log(include_list); $("#include_div").hide(); } var HITStorage = {}; var indexedDB = window.indexedDB || window.webkitIndexedDB || window.mozIndexedDB; window.IDBTransaction = window.IDBTransaction || window.webkitIDBTransaction || window.mozIDBTransaction; window.IDBKeyRange = window.IDBKeyRange || window.webkitIDBKeyRange || window.mozIDBKeyRange; HITStorage.IDBTransactionModes = { "READ_ONLY": "readonly", "READ_WRITE": "readwrite", "VERSION_CHANGE": "versionchange" }; var IDBKeyRange = window.IDBKeyRange; HITStorage.indexedDB = {}; HITStorage.indexedDB = {}; HITStorage.indexedDB.db = null; HITStorage.indexedDB.onerror = function(e) { console.log(e); }; var v=4; HITStorage.indexedDB.checkTitle = function(title,button) { var request = indexedDB.open("HITDB", v); request.onsuccess = function(e) { HITStorage.indexedDB.db = e.target.result; var db = HITStorage.indexedDB.db; if (!db.objectStoreNames.contains("HIT")) { db.close(); return; } var trans = db.transaction(["HIT"], HITStorage.IDBTransactionModes.READ_ONLY); var store = trans.objectStore("HIT"); var index = store.index("title"); index.get(title).onsuccess = function(event) { if (event.target.result === undefined) { console.log(title + ' not found'); history[button].titledb=false; } else { console.log(title + ' found'); history[button].titledb=true; } db.close(); }; }; request.onerror = HITStorage.indexedDB.onerror; }; HITStorage.indexedDB.checkRequester = function(id,button) { var request = indexedDB.open("HITDB", v); request.onsuccess = function(e) { HITStorage.indexedDB.db = e.target.result; var db = HITStorage.indexedDB.db; if (!db.objectStoreNames.contains("HIT")) { db.close(); return; } var trans = db.transaction(["HIT"], HITStorage.IDBTransactionModes.READ_ONLY); var store = trans.objectStore("HIT"); var index = store.index("requesterId"); index.get(id).onsuccess = function(event) { if (event.target.result === undefined) {history[button].reqdb=false; console.log(id + ' not found'); } else { history[button].reqdb=true; console.log(id + ' found'); } db.close(); }; }; request.onerror = HITStorage.indexedDB.onerror; }; var PAGES_TO_SCRAPE = 3; var MINIMUM_HITS = 100; var SEARCH_REFRESH=0; var URL_BASE = "/mturk/searchbar?searchWords=&selectedSearchType=hitgroups"; var initial_url = URL_BASE; var TO_REQ_URL = "http://turkopticon.ucsd.edu/reports?id="; var found_key_list=[]; var last_clear_time = new Date().getTime(); var searched_once = false; var save_new_results_time = 120; var save_results_time = 3600; var default_type = 0; var cur_loc = window.location.href; var time_input = document.createElement("INPUT"); time_input.value = 0; var page_input = document.createElement("INPUT"); page_input.value = 3; var min_input = document.createElement("INPUT"); var new_time_display_input = document.createElement("INPUT"); new_time_display_input.value = 300; var reward_input = document.createElement("INPUT"); var qual_input = document.createElement("INPUT"); qual_input.type = "checkbox"; qual_input.checked = true; var masters_input = document.createElement("INPUT"); masters_input.type = "checkbox"; var sort_input1 = document.createElement("INPUT"); sort_input1.type = "radio"; sort_input1.name = "sort_type"; sort_input1.value = "latest"; sort_input1.checked = true; var sort_input2 = document.createElement("INPUT"); sort_input2.type = "radio"; sort_input2.name = "sort_type"; sort_input2.value = "most"; var sort_input3 = document.createElement("INPUT"); sort_input3.type = "radio"; sort_input3.name = "sort_type"; sort_input3.value = "amount"; var sort_input4 = document.createElement("INPUT"); sort_input4.type = "radio"; sort_input4.name = "sort_type"; sort_input4.value = "A-Z"; var sort_input_invert = document.createElement("INPUT"); sort_input_invert.type = "checkbox"; var friesAreDone = document.createElement("INPUT"); friesAreDone.type = "checkbox"; var correctForSkips = document.createElement("INPUT"); correctForSkips.type = "checkbox"; correctForSkips.checked = true; var matchOnly = document.createElement("INPUT"); matchOnly.type = "checkbox"; var search_input = document.createElement("INPUT"); var LINK_BASE = "https://www.mturk.com"; var STATUSDETAIL_DELAY = 250; var MPRE_DELAY = 3000; $('body').css('background', BACKGROUND_COLOR); var next_page = 1; var API_PROXY_BASE = 'https://mturk-api.istrack.in/'; var API_MULTI_ATTRS_URL = API_PROXY_BASE + 'multi-attrs.php?ids='; var REVIEWS_BASE = 'http://turkopticon.ucsd.edu/'; var control_panel_HTML = '
'; $('body > :not(#control_panel)').hide(); //hide all nodes directly under the body $('body').prepend(control_panel_HTML); var control_panel = document.getElementById("control_panel"); var big_red_button = document.createElement("BUTTON"); var reset_blocks = document.createElement("BUTTON"); var include_button = document.createElement("BUTTON"); var progress_report = document.createTextNode("Stopped"); var status_report = document.createTextNode("None"); var text_area = document.createElement("TABLE"); big_red_button.textContent = "Show Interface"; big_red_button.onclick = function(){show_interface();}; control_panel.appendChild(big_red_button); show_interface(); var global_run = false; var statusdetail_loop_finished = false; var date_header = ""; var history = {}; var wait_loop; function set_progress_report(text, force) { if (global_run == true || force == true) { progress_report.textContent = text; status_report.textContent = status_text; } } function get_progress_report() { return progress_report.textContent; } function wait_until_stopped() { if (global_run == true) { if (statusdetail_loop_finished == true) { big_red_button.textContent = "Start"; set_progress_report("Finished", false); } else { setTimeout(function(){wait_until_stopped();}, 500); } } } function display_wait_time(wait_time) { if (global_run == true) { var current_progress = get_progress_report(); if (current_progress.indexOf("Searching again in")!==-1) { set_progress_report(current_progress.replace(/Searching again in \d+ seconds/ , "Searching again in " + wait_time + " seconds"),false); } else set_progress_report(current_progress + " Searching again in " + wait_time + " seconds.", false); if (wait_time>1) setTimeout(function(){display_wait_time(wait_time-1);}, 1000); } } function dispArr(ar) { var disp = ""; for (var z = 0; z < ar.length; z++) { disp += "id " + z + " is " + ar[z] + " "; } console.log(disp); } function scrape($src) { var $requester = $src.find('a[href^="/mturk/searchbar?selectedSearchType=hitgroups&requester"]'); var $title = $src.find('a[class="capsulelink"]'); var $reward = $src.find('span[class="reward"]'); var $preview = $src.find('a[href^="/mturk/preview?"]'); var $qualified = $src.find('a[href^="/mturk/notqualified?"]'); var $times = $src.find('a[id^="duration_to_complete"]'); var $descriptions = $src.find('a[id^="description"]'); var not_qualified_group_IDs=[]; var $quals = $src.find('a[id^="qualificationsRequired"]'); $qualified.each(function(){ var groupy = $(this).attr('href'); groupy = groupy.replace(/\/mturk\/notqualified\?hitGroupId=([A-Z0-9]+)(&.+)?/,"$1"); groupy = groupy.replace("/mturk/notqualified?hit",""); not_qualified_group_IDs.push(groupy); }); var $mixed = $src.find('a[href^="/mturk/preview?"],a[href^="/mturk/notqualified?"]'); var listy =[]; $mixed.each(function(){ var groupy = $(this).attr('href'); groupy = groupy.replace(/\/mturk\/notqualified\?hitGroupId=([A-Z0-9]+)(&.+)?/,"$1"); groupy = groupy.replace("/mturk/notqualified?hit",""); groupy = groupy.replace("/mturk/preview?groupId=",""); listy.push(groupy); }); listy = listy.filter(function(elem, pos) { return listy.indexOf(elem) == pos; }); for (var j = 0; j < $requester.length; j++) { var $hits = $requester.eq(j).parent().parent().parent().parent().parent().parent().find('td[class="capsule_field_text"]'); var requester_name = $requester.eq(j).text().trim(); var requester_link = $requester.eq(j).attr('href'); var group_ID=(listy[j] ? listy[j].replace(/\/mturk\/notqualified\?hitGroupId=([A-Z0-9]+)(&.+)?/,"$1") : ""); if (listy[j] && listy[j].indexOf("notqualified") > -1) noqual = true; group_ID=group_ID.replace("/mturk/notqualified?hit",""); var masters = false; var preview_link = "/mturk/preview?groupId=" + group_ID; var title = $title.eq(j).text().trim(); var reward = $reward.eq(j).text().trim(); var hits = $hits.eq(4).text().trim(); var time = $times.eq(j).parent()[0].nextSibling.nextSibling.innerHTML; var description = $descriptions.eq(j).parent()[0].nextSibling.nextSibling.innerHTML; //console.log(description); var requester_id = requester_link.replace('/mturk/searchbar?selectedSearchType=hitgroups&requesterId=',''); var accept_link; accept_link = preview_link.replace('preview','previewandaccept'); /*HIT SCRAPER ADDITION*/ var qElements = $quals.eq(j).parent().parent().parent().find('tr'); //console.log(qElements); var qualifications = []; for (var i = 1; i < qElements.length; i++) { qualifications.push((qElements[i].childNodes[1].textContent.trim().replace(/\s+/g, ' ').indexOf("Masters") != -1 ? "[color=red][b]"+qElements[i].childNodes[1].textContent.trim().replace(/\s+/g, ' ')+"[/b][/color]" : qElements[i].childNodes[1].textContent.trim().replace(/\s+/g, ' '))); if (qElements[i].childNodes[1].textContent.trim().replace(/\s+/g, ' ').indexOf("Masters") != -1) masters=true; } var qualList = (qualifications.join(', ') ? qualifications.join(', ') : "None"); key = requester_name+title+reward+group_ID; found_key_list.push(key); if (history[key] == undefined) { history[key] = {requester:"", title:"", description:"", reward:"", hits:"", req_link:"", quals:"", prev_link:"", rid:"", acc_link:"", new_result:"", qualified:"", found_this_time:"", initial_time:"", reqdb:"",titledb:"",time:"",masters:false}; history[key].req_link = requester_link; history[key].prev_link = preview_link; history[key].requester = requester_name; history[key].title = title; history[key].reward = reward; history[key].hits = hits; history[key].rid = requester_id; history[key].acc_link = accept_link; history[key].time = time; history[key].quals = qualList; history[key].description = description; history[key].masters = masters; HITStorage.indexedDB.checkRequester(requester_id,key); HITStorage.indexedDB.checkTitle(title,key); if (searched_once) { history[key].initial_time = new Date().getTime();//-1000*(save_new_results_time - SEARCH_REFRESH); history[key].new_result = 0; } else { history[key].initial_time = new Date().getTime()-1000*save_new_results_time; history[key].new_result = 1000*save_new_results_time; } if (not_qualified_group_IDs.indexOf(group_ID)!==-1) history[key].qualified = false; else history[key].qualified = true; history[key].found_this_time = true; } else { history[key].new_result = new Date().getTime() - history[key].initial_time; history[key].found_this_time = true; history[key].hits = hits; } } } function statusdetail_loop(next_URL) { if (global_run == true) { if (next_URL.length != 0) { $.get(next_URL, function(data) { var $src = $(data); var maxpagerate = $src.find('td[class="error_title"]:contains("You have exceeded the maximum allowed page request rate for this website.")'); if (maxpagerate.length == 0) { if (next_page > PAGES_TO_SCRAPE) { if(status_text.indexOf("Correcting for skips") == -1) status_text += ". Correcting for skips"; } set_progress_report("Processing page " + next_page, false); scrape($src); $next_URL = $src.find('a[href^="/mturk/viewsearchbar"]:contains("Next")'); next_URL = ($next_URL.length != 0) ? $next_URL.attr("href") : ""; next_page++; if (default_type == 1) { var hmin = MINIMUM_HITS+1; for (j = 0; j < found_key_list.length; j++) { console.log(history[found_key_list[j]]); if (history[found_key_list[j]].hits < hmin) { next_URL = ""; next_page = -1; break; } } } else if (next_page > PAGES_TO_SCRAPE && correct_for_skips) { var skipped_hits = 0; var added_pages = 0; for (j = 0; j < found_key_list.length; j++) { var obj = history[found_key_list[j]]; if (!ignore_check(obj.requester,obj.title)) skipped_hits++; } added_pages = Math.floor(skipped_hits/10); if (skipped_hits%10 >6) added_pages++; if (next_page > PAGES_TO_SCRAPE + added_pages) { next_URL = ""; next_page = -1; } } else if (next_page > PAGES_TO_SCRAPE) { next_URL = ""; next_page = -1; } setTimeout(function(){statusdetail_loop(next_URL);}, STATUSDETAIL_DELAY); } else { console.log("MPRE"); setTimeout(function(){statusdetail_loop(next_URL);}, MPRE_DELAY); } }); } else { searched_once = true; var found_hits = found_key_list.length; var shown_hits = 0; var new_hits = 0; var url = API_MULTI_ATTRS_URL; var rids = []; var lastRow = text_area.rows.length - 1; for (i = lastRow; i>0; i--) text_area.deleteRow(i); for (j = 0; j < found_key_list.length; j++) { //(function(url,rids,j) { var obj = history[found_key_list[j]]; if (ignore_check(obj.requester,obj.title) && obj.found_this_time){ ++shown_hits; //console.log(obj); //hit export will update col_heads[1] var col_heads = ["" + obj.requester + "","" + obj.title + "",obj.reward,obj.hits,"TO down","Accept","M"]; var row = text_area.insertRow(text_area.rows.length); url += obj.rid + ','; rids.push(obj.rid); if (check_hitDB) { col_heads.push("R"); col_heads.push("T"); } if (!obj.qualified) { col_heads.push("Not Qualified"); } for (i=0; iDate | Requester | HIT Title | Reward | Status | Feedback |
---|---|---|---|---|---|
$' + sum.toFixed(2) + ' |
Found " + results.length + " matching HITs. $" + sum_approved.toFixed(2) + " approved, " + "$" + sum_rejected.toFixed(2) + " rejected and $" + sum_pending.toFixed(2) + " pending.
"); resultsWindow.document.write("") resultsWindow.document.close(); } function export_func(item) { HIT = item; edit_button.textContent = 'Edit Template'; apply_template(item); div.style.display = 'block'; textarea.select(); } function apply_template(hit_data) { var txt = TEMPLATE; var vars = ['title', 'requester', 'rid', 'description', 'reward', 'quals', 'prev_link', 'time', 'hits', 'to_stuff', 'to_text']; var resp = null; if (txt.indexOf('{to_text}') >= 0 || txt.indexOf('{to_stuff}') >= 0){ var url = buildXhrUrl(hit_data["rid"]); resp = makeXhrQuery(url); //console.log(resp); } var toText = ""; var toStuff = ""; var toData = ""; var numResp = (resp == null || resp == "TO DOWN" ? "n/a" : resp[hit_data["rid"]].reviews); if (resp == "TO DOWN"){ toStuff = " [URL=\""+TO_BASE+hit_data['rid']+"\"]TO down.[/URL]"; toText = toStuff; } else if (resp == null || resp[hit_data["rid"]].attrs == null && resp != "TO DOWN") { toStuff = " No TO "; toText = " No TO "; toStuff += "[URL=\""+TO_BASE+"report?requester[amzn_id]=" + hit_data['rid'] + "&requester[amzn_name]=" + hit_data['requester'] + "\"]"; toStuff += "(Submit a new TO rating for this requester)[/URL]"; } else { for (var key in resp[hit_data["rid"]].attrs) { //toText += "\n[*]"+key+": "+resp[hit_data["requesterId"]].attrs[key]+"\n"; var i = 0; var color = "green"; var name = key; var num = Math.floor(resp[hit_data["rid"]].attrs[key]); switch (key){ case "comm": name = "Communicativity"; break; case "pay": name = "Generosity"; break; case "fast": name = "Promptness"; break; case "fair": name = "Fairness"; break; default: name = key; break; } switch (num){ case 0: color = "red"; break; case 1: color = "red"; break; case 2: color = "orange"; break; case 3: color = "yellow"; break; default: break; } toText += (num > 0 ? "\n[color="+color+"]" : "\n"); for (i; i < num; i++){ toText += "[b]"+symbol+"[/b]" } toText += (num > 0 ? "[/color]" : "") if (i < 5){ toText += "[color=white]"; for (i; i < 5; i++) toText += "[b]"+symbol+"[/b]"; toText += "[/color]"; } toText += " "+Number(resp[hit_data["rid"]].attrs[key]).toFixed(2)+" "+name; toData += Number(resp[hit_data["rid"]].attrs[key]).toFixed(2) + ","; } //toText += "[/list]"; toText += (txt.indexOf('{to_stuff}') >= 0 ? "" : "\nNumber of Reviews: "+numResp+"\n[URL=\""+TO_BASE+"report?requester[amzn_id]=" + hit_data['rid'] + "&requester[amzn_name]=" + hit_data['requester'] + "\"](Submit a new TO rating for this requester)[/URL]"); toStuff = '\n[img]http://data.istrack.in/to/' + toData.slice(0,-1) + '.png[/img]'; toStuff += (txt.indexOf('{to_stuff}') >= 0 ? (txt.indexOf('{to_text}') >= 0 ? "" : toText) : ""); toStuff += "\nNumber of Reviews: "+numResp; toStuff += "[URL=\""+TO_BASE+"report?requester[amzn_id]=" + hit_data['rid'] + "&requester[amzn_name]=" + hit_data['requester'] + "\"]"; toStuff += "\n(Submit a new TO rating for this requester)[/URL]"; } for (var i = 0; i < vars.length; i++) { t = new RegExp('\{' + vars[i] + '\}', 'g'); if (vars[i] == "to_stuff") { txt = txt.replace(t, toStuff); } else if (vars[i] == "to_text"){ txt = txt.replace(t, toText); } else if (vars[i] == "prev_link"){ txt = txt.replace(t,"https://www.mturk.com"+hit_data[vars[i]]); } else if (vars[i] == "acc_link"){ txt = txt.replace(t,"https://www.mturk.com"+hit_data[vars[i]]); } else txt = txt.replace(t, hit_data[vars[i]]); } textarea.value = txt; } function hide_func(div) { if (EDIT == false) div.style.display = 'none'; } function edit_func() { if (EDIT == true) { EDIT = false; TEMPLATE = textarea.value; edit_button.textContent = 'Edit Template'; apply_template(HIT); } else { console.log("Editing"); EDIT = true; edit_button.textContent = 'Show Changes'; save_button.disabled = false; textarea.value = TEMPLATE; } } function default_func() { GM_deleteValue('HITScraper Template'); TEMPLATE = DEFAULT_TEMPLATE; EDIT = false; edit_button.textContent = 'Edit Template'; apply_template(HIT); } function save_func() { if (EDIT) TEMPLATE = textarea.value; GM_setValue('HITScraper Template', TEMPLATE); } var div = document.createElement('div'); var textarea = document.createElement('textarea'); var div2 = document.createElement('label'); div.style.position = 'fixed'; div.style.width = '500px'; div.style.height = '235px'; div.style.left = '50%'; div.style.right = '50%'; div.style.margin = '-250px 0px 0px -250px'; div.style.top = '300px'; div.style.padding = '5px'; div.style.border = '2px'; div.style.backgroundColor = 'black'; div.style.color = 'white'; div.style.zIndex = '100'; textarea.style.padding = '2px'; textarea.style.width = '500px'; textarea.style.height = '200px'; textarea.title = '{title}\n{requester}\n{rid}\n{description}\n{reward}\n{quals}\n{prev_link}\n{time}\n{hit}\n{to_stuff}\n{to_text}'; div.textContent = 'Press Ctrl+C to copy to clipboard. Click textarea to close'; div.style.fontSize = '12px'; div.appendChild(textarea); var edit_button = document.createElement('button'); var save_button = document.createElement('button'); var default_button = document.createElement('button'); var easy_button = document.createElement('button'); edit_button.textContent = 'Edit Template'; edit_button.setAttribute('id', 'edit_button'); edit_button.style.height = '18px'; edit_button.style.width = '100px'; edit_button.style.fontSize = '10px'; edit_button.style.paddingLeft = '3px'; edit_button.style.paddingRight = '3px'; edit_button.style.backgroundColor = 'white'; save_button.textContent = 'Save Template'; save_button.setAttribute('id', 'save_button'); save_button.style.height = '18px'; save_button.style.width = '100px'; save_button.style.fontSize = '10px'; save_button.style.paddingLeft = '3px'; save_button.style.paddingRight = '3px'; save_button.style.backgroundColor = 'white'; save_button.style.marginLeft = '5px'; easy_button.textContent = 'Change Adfly Url'; easy_button.setAttribute('id', 'easy_button'); easy_button.style.height = '18px'; easy_button.style.width = '100px'; easy_button.style.fontSize = '10px'; easy_button.style.paddingLeft = '3px'; default_button.textContent = ' D '; default_button.setAttribute('id', 'default_button'); default_button.style.height = '18px'; default_button.style.width = '20px'; default_button.style.fontSize = '10px'; default_button.style.paddingLeft = '3px'; default_button.style.paddingRight = '3px'; default_button.style.backgroundColor = 'white'; default_button.style.marginLeft = '5px'; default_button.title = 'Return default template'; div.appendChild(edit_button); div.appendChild(save_button); div.appendChild(default_button); div.appendChild(easy_button); save_button.disabled = true; div.style.display = 'none'; textarea.addEventListener("click", function() {hide_func(div);}, false); edit_button.addEventListener("click", function() {edit_func();}, false); save_button.addEventListener("click", function() {save_func();}, false); default_button.addEventListener("click", function() {default_func();}, false); document.body.insertBefore(div, document.body.firstChild);