Scrape, display, sort and search your Mturk qualifications
当前为 
// ==UserScript== // @name Mturk Qualification Database and Scraper // @namespace https://greasyfork.org/en/users/1004048-elias041 // @version 0.4 // @description Scrape, display, sort and search your Mturk qualifications // @author Elias041 // @match https://worker.mturk.com/qualifications/assigned // @match https://worker.mturk.com/qt // @require https://code.jquery.com/jquery-3.6.3.js // @require https://code.jquery.com/ui/1.13.1/jquery-ui.min.js // @require https://unpkg.com/dexie/dist/dexie.js // @require https://unpkg.com/[email protected]/dist/ag-grid-community.min.js // @require https://cdnjs.cloudflare.com/ajax/libs/moment.js/2.29.4/moment.min.js // @resource https://cdn.jsdelivr.net/npm/ag-grid-community/styles/ag-grid.css // @resource https://cdn.jsdelivr.net/npm/ag-grid-community/styles/ag-theme-apline.css // @icon https://www.google.com/s2/favicons?sz=64&domain=mturk.com // @license none // @grant none // ==/UserScript== let timeout = 1850; let counter = " "; let retry_count = 0; let page = "https://worker.mturk.com/qualifications/assigned.json?page_size=100"; let timeoutId = undefined; let scraping = false window.onload = function () { let t = document.getElementsByClassName("col-xs-5 col-md-3 text-xs-right p-l-0")[0], e = t.parentNode, o = document.createElement("div"); o.style.color = "#fff"; o.style.padding = "10px"; o.style.boxShadow = "2px 2px 4px #888888"; o.style.background = "#33773A"; o.style.opacity = "0.5"; o.style.cursor = "pointer"; o.id = "button"; o.innerHTML = "Scrape Quals"; e.insertBefore(o, t); let c = document.createElement("div"); c.style.color = "#fff"; c.style.background = "#C78D99"; c.style.padding = "10px"; c.style.boxShadow = "2px 2px 4px #888888"; c.style.background = "#383c44"; c.style.opacity = "0.5"; c.style.cursor = "pointer"; c.innerHTML = "Cancel"; c.id = "cancelButton"; e.insertBefore(c, t); let d = document.createElement("div"); d.style.color = "#fff"; d.style.background = "#fc0f03"; d.style.padding = "10px"; d.style.boxShadow = "2px 2px 4px #888888"; d.style.background = "#323552"; d.style.opacity = "0.5"; d.style.cursor = "pointer"; d.innerHTML = "Database"; d.id = "dbButton"; e.insertBefore(d, t); let f = document.createElement("div"); f.style.color = "#fff"; f.style.padding = "10px"; f.style.boxShadow = "2px 2px 4px #888888"; f.style.background = "#33773A"; f.style.opacity = "0.5"; f.id = "progress"; f.innerHTML = "-"; e.insertBefore(f, t); document.getElementById("dbButton").addEventListener("click", function e() { window.open("https://worker.mturk.com/qt", "_blank") }) document.getElementById("cancelButton").addEventListener("click", function e() { scraping = false $("#cancelButton").css('background', '#383c44') $("#button").css('background', '#33773A') $("#progress").html("-") }) document.getElementById("button").addEventListener("click", function e() { scraping = true; $("#button").css('background', '#383c44') $("#cancelButton").css('background', '#CE3132') /*init db*/ var db = new Dexie("qualifications"); db.version(1).stores( { quals: ` id, requester, description, score, date, qualName, reqURL, reqQURL, retURL, canRetake, hasTest, canRequest, isSystem` }); /*main loop*/ function getAssignedQualifications(nextPageToken = "") { if (!scraping) { return; } //cancel trap counter++ $("#progress").html(counter); //$("#progressBar").html("   Processing page " + counter + "   "); //console.log("scraping") $.getJSON(page) .then(function (data) { data.assigned_qualifications.forEach(function (t) { db.quals.bulkAdd([ { id: t.request_qualification_url, requester: t.creator_name, description: t.description, canRetake: t.can_retake_test_or_rerequest, retry: t.earliest_retriable_time, score: t.value, date: t.grant_time, qualName: t.name, reqURL: t.creator_url, retURL: t.retake_test_url, isSystem: t.is_system_qualification, canRequest: t.is_requestable, hasTest: t.has_test }]) }) if (data.next_page_token !== null) { timeoutId = setTimeout(() => { page = `https://worker.mturk.com/qualifications/assigned.json?page_size=100&next_token=${encodeURIComponent(data.next_page_token)}` getAssignedQualifications(data.next_page_token); }, timeout); } else { console.log("Scraping completed"); console.log(counter + "pages"); console.log("Timeout" + timeout); console.log(retry_count + "timeouts"); $("#cancelButton").css('background', '#383c44'); $("#progress").css('background', '#25dc12'); $("#progress").html('✓'); $("#dbButton$").css('background', '#25dc12'); } }) .catch(function (error) { //handle timeouts if (error.status === 429 && retry_count < 5) { retry_count++; timeout += 500; console.log("timed out, incrementing clock to " + timeout + " milliseconds") setTimeout(() => { getAssignedQualifications(nextPageToken); }, 10000); } else { $("#progressBar").html("Timed out 5 times, aborting. " + timeout + " milliseconds."); console.log("Timed out 5 times, aborting. " + timeout + " milliseconds."); } /* $("#button").html("Retry?"); $("#button").css("background-color", "#e80c0f"); document.getElementById("button").addEventListener("click", function e() { location.reload() }*/ } ) } getAssignedQualifications(); } ) }; /*ag-grid*/ if (location.href === "https://worker.mturk.com/qt") { document.body.innerHTML = ""; let gridDiv = document.createElement("div"); gridDiv.setAttribute("id", "gridDiv"); document.body.appendChild(gridDiv); document.title = "Qualifications"; /*init db*/ var db = new Dexie("qualifications"); db.version(1).stores( { quals: ` id, requester, description, score, date, qualName, reqURL, reqQURL, retURL, canRetake, hasTest, canRequest, isSystem` }); gridDiv.innerHTML = ` <div id="myGrid" class="ag-theme-alpine"> <style> .ag-theme-alpine { --ag-grid-size: 3px; width: 100%; height: 100%; position: absolute; top: 0; left: 0; right: 0; bottom: 0; } </style> </div>` const gridOptions = { columnDefs: [ { headerName: 'Mturk Qualification Database and Scraper', children: [ { field: "qualName" }, { field: "requester" }] }, { headerName: ' ', children: [ { field: "description", width: 350 }, { headerName: "Value", field: "score", width: 100 }, { headerName: "Date", field: "date", width: 100, valueGetter: function (params) { var date = new Date(params.data.date); return (date.getMonth() + 1) + "/" + date.getDate() + "/" + date.getFullYear(); }, comparator: function (valueA, valueB, nodeA, nodeB, isInverted) { var dateA = new Date(valueA); var dateB = new Date(valueB); return dateA - dateB; }, //valueFormatter: function(params) { // return new Date(params.value).toString().substring(4, 15); //} }, { headerName: "Requester ID", width: 150, field: "reqURL", valueFormatter: function (params) { var parts = params.value.split("/"); return parts[2]; }, }, { headerName: "Qual ID", field: "id", valueFormatter: function (params) { if (!params.value || params.value === '') return ''; var parts = params.value.split("/"); return parts[2]; } }] }, { headerName: 'More', children: [ { headerName: " ", field: " ", width: 100, columnGroupShow: 'closed' }, { headerName: "Retake", field: "canRetake", width: 100, columnGroupShow: 'open', suppressMenu: true }, { headerName: "hasTest", field: "hasTest", width: 100, columnGroupShow: 'open', suppressMenu: true }, { headerName: "canReq", field: "canRequest", width: 100, columnGroupShow: 'open', suppressMenu: true }, { headerName: "System", field: "isSystem", width: 100, columnGroupShow: 'open', suppressMenu: true }, ] } ], defaultColDef: { sortable: true, filter: true, editable: true, resizable: true, }, rowSelection: 'multiple', animateRows: true, rowData: [] }; window.addEventListener('load', function () { const gridDiv = document.querySelector('#myGrid'); db.quals.toArray().then(data => { var filteredData = data.filter(function (row) { return !row.qualName.includes("Exc: ["); }); gridOptions.rowData = filteredData; new agGrid.Grid(gridDiv, gridOptions); }) }) };