<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">1438-8871</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v16i10e233</article-id>
            <article-id pub-id-type="pmid">25356929</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.3807</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Original Paper</subject>
                </subj-group>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Rapid Grading of Fundus Photographs for Diabetic Retinopathy Using Crowdsourcing</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Brabham</surname>
                        <given-names>Daren</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Leontidis</surname>
                        <given-names>Georgios</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" corresp="yes">
                    <name name-style="western">
                        <surname>Brady</surname>
                        <given-names>Christopher J</given-names>
                    </name>
                    <degrees>MD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <address>
                        <institution>Wilmer Eye Institute</institution>
                        <institution>Johns Hopkins University School of Medicine</institution>
                        <addr-line>600 N Wolfe St.</addr-line>
                        <addr-line>Maumenee 711</addr-line>
                        <addr-line>Baltimore, MD, 21287</addr-line>
                        <country>United States</country>
                        <phone>1 (410) 502 2789</phone>
                        <fax>1 (443) 287 8343</fax>
                        <email>brady@jhmi.edu</email>
                    </address>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-7847-3914</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Villanti</surname>
                        <given-names>Andrea C</given-names>
                    </name>
                    <degrees>MPH, PhD</degrees>
                    <xref rid="aff3" ref-type="aff">3</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3104-966X</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Pearson</surname>
                        <given-names>Jennifer L</given-names>
                    </name>
                    <degrees>MPH, PhD</degrees>
                    <xref rid="aff3" ref-type="aff">3</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1400-5932</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib4">
                    <name name-style="western">
                        <surname>Kirchner</surname>
                        <given-names>Thomas R</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff3" ref-type="aff">3</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-5764-4980</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib5">
                    <name name-style="western">
                        <surname>Gupta</surname>
                        <given-names>Omesh P</given-names>
                    </name>
                    <degrees>MBA, MD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4845-0409</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib6">
                    <name name-style="western">
                        <surname>Shah</surname>
                        <given-names>Chirag P</given-names>
                    </name>
                    <degrees>MPH, MD</degrees>
                    <xref rid="aff4" ref-type="aff">4</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6369-4917</ext-link>
                </contrib>
            </contrib-group>
            <aff id="aff1">
                <sup>1</sup>
                <institution>Wills Eye Hospital</institution>
                <institution>Retina Service: Mid Atlantic Retina</institution>
                <addr-line>Philadelphia, PA</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff2">
                <sup>2</sup>
                <institution>Wilmer Eye Institute</institution>
                <institution>Johns Hopkins University School of Medicine</institution>
                <addr-line>Baltimore, MD</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff3">
                <sup>3</sup>
                <institution>Schroeder Institute for Tobacco Research and Policy Studies</institution>
                <institution>Legacy</institution>
                <addr-line>Washington, DC</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff4">
                <sup>4</sup>
                <institution>Ophthalmic Consultants of Boston</institution>
                <addr-line>Boston, MA</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Christopher J Brady <email>brady@jhmi.edu</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <month>10</month>
                <year>2014</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>30</day>
                <month>10</month>
                <year>2014</year>
            </pub-date>
            <volume>16</volume>
            <issue>10</issue>
            <elocation-id>e233</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>25</day>
                    <month>08</month>
                    <year>2014</year>
                </date>
                <date date-type="rev-request">
                    <day>10</day>
                    <month>09</month>
                    <year>2014</year>
                </date>
                <date date-type="rev-recd">
                    <day>15</day>
                    <month>09</month>
                    <year>2014</year>
                </date>
                <date date-type="accepted">
                    <day>16</day>
                    <month>09</month>
                    <year>2014</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Christopher J Brady, Andrea C Villanti, Jennifer L Pearson, Thomas R Kirchner, Omesh P Gupta, Chirag P Shah. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 30.10.2014. </copyright-statement>
            <copyright-year>2014</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2014/10/e233/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Screening for diabetic retinopathy is both effective and cost-effective, but rates of screening compliance remain suboptimal. As screening improves, new methods to deal with screening data may help reduce the human resource needs. Crowdsourcing has been used in many contexts to harness distributed human intelligence for the completion of small tasks including image categorization.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>Our goal was to develop and validate a novel method for fundus photograph grading.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>An interface for fundus photo classification was developed for the Amazon Mechanical Turk crowdsourcing platform. We posted 19 expert-graded images for grading by Turkers, with 10 repetitions per photo for an initial proof-of-concept (Phase I). Turkers were paid US $0.10 per image. In Phase II, one prototypical image from each of the four grading categories received 500 unique Turker interpretations. Fifty draws of 1-50 Turkers were then used to estimate the variance in accuracy derived from randomly drawn samples of increasing crowd size to determine the minimum number of Turkers needed to produce valid results. In Phase III, the interface was modified to attempt to improve Turker grading.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>Across 230 grading instances in the normal versus abnormal arm of Phase I, 187 images (81.3%) were correctly classified by Turkers. Average time to grade each image was 25 seconds, including time to review training images. With the addition of grading categories, time to grade each image increased and percentage of images graded correctly decreased. In Phase II, area under the curve (AUC) of the receiver-operator characteristic (ROC) indicated that sensitivity and specificity were maximized after 7 graders for ratings of normal versus abnormal (AUC=0.98) but was significantly reduced (AUC=0.63) when Turkers were asked to specify the level of severity. With improvements to the interface in Phase III, correctly classified images by the mean Turker grade in four-category grading increased to a maximum of 52.6% (10/19 images) from 26.3% (5/19 images). Throughout all trials, 100% sensitivity for normal versus abnormal was maintained.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>With minimal training, the Amazon Mechanical Turk workforce can rapidly and correctly categorize fundus photos of diabetic patients as normal or abnormal, though further refinement of the methodology is needed to improve Turker ratings of the degree of retinopathy. Images were interpreted for a total cost of US $1.10 per eye. Crowdsourcing may offer a novel and inexpensive means to reduce the skilled grader burden and increase screening for diabetic retinopathy.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>diabetic retinopathy</kwd>
                <kwd>telemedicine</kwd>
                <kwd>fundus photography</kwd>
                <kwd>crowdsourcing</kwd>
                <kwd>Amazon Mechanical Turk</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>Since early diabetic retinopathy (DR) is often asymptomatic, detection of disease at this stage is either incidental or by deliberate screening. Screening for DR is both effective and cost-effective [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>], but adherence rates to published guidelines for screening for DR are low, with only 35-60% of diabetic patients receiving an annual dilated fundus examination in the United States [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. As a way to increase adherence, telehealth screening using non-mydriatic fundus photography and remote interpretation is increasing, especially in rural and remote settings [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Early diagnosis of DR and institution of appropriate therapy represents an enormous opportunity to prevent vision loss in a young, working-age demographic [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Telehealth, in particular, may be a way to control provider, payer, and societal costs.</p>
            <p>Among the costs of a telehealth program are the fundus camera, the telehealth software package, and the human resources needed for image acquisition and interpretation. Fundus photo interpretation costs in diabetic retinopathy screening may be high given the labor-intensive interpretation protocols and the need to interpret multiple images per patient. Computerized, semi-automated image analysis techniques have been developed that may be able to reduce physician workload and screening costs [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]; however, these methods are not FDA-approved, nor in wide use clinically at this time. If telehealth continues to expand, low-cost methods will be needed to interpret the large volume of fundus images expected with rising incidence of diabetes, especially in resource-poor settings and in large public health screenings.</p>
            <p>Crowdsourcing is defined by Brabham as &#8220;an online, distributed problem-solving and production model that leverages the collective intelligence of online communities to serve specific organizational goals&#8221; [<xref ref-type="bibr" rid="ref15">15</xref>]. A subset of crowdsourcing, which he terms &#8220;distributed-human-intelligence tasking&#8221;, can involve subdividing larger tasks into small portions and then recruiting a group of individuals to each complete these small portions, and only collectively, the entire task [<xref ref-type="bibr" rid="ref15">15</xref>]. The use of crowdsourcing in biomedical research is in its infancy, though some groups have used this method in public health research [<xref ref-type="bibr" rid="ref16">16</xref>] and to interpret medical imaging. For example, malaria researchers have used a Web-based game to recruit untrained, anonymous volunteers to&#160;tag and count malaria parasites on digital images of blood smears [<xref ref-type="bibr" rid="ref17">17</xref>]. The investigators showed that by combining the analyses of&#160;several users, they were able to&#160;achieve similar accuracy rates to expert microscopists. Crowdsourcing has recently been used to categorize a number of fundus photos with a variety of diagnoses as normal or abnormal [<xref ref-type="bibr" rid="ref18">18</xref>]. In a trial conducted in the United Kingdom using untrained graders, the sensitivity was &#8805;96% for normal versus severely abnormal and between 61-79% for normal versus mildly abnormal [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
            <p>The current research uses diabetic retinopathy as the test condition to explore whether a crowdsourcing interface can be used to train workers to classify human fundus photos as normal or abnormal and subsequently conduct diagnostic grading of images [<xref ref-type="bibr" rid="ref19">19</xref>]. This project estimates the validity and reliability of crowdsourced grading of images for diabetic retinopathy, compared to the criterion standard of expert grading. Our hypothesis is that crowdsourced grading of fundus photography interpretation can be rapid, accurate, and reliable in the screening for diabetic retinopathy.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Crowdsourcing</title>
                <p>An interface for fundus photo classification was developed for the Amazon Mechanical Turk (AMT [<xref ref-type="bibr" rid="ref20">20</xref>]) crowdsourcing platform (<xref ref-type="fig" rid="figure1">Figure 1</xref>). AMT is an online labor market that allows access to thousands of people who can quickly accomplish small, discrete tasks for small amounts of money. Typical AMT tasks include tagging photos, translating words, or writing very short articles for websites. AMT has also been used to annotate photos of the tobacco point-of-sale retail environment [<xref ref-type="bibr" rid="ref21">21</xref>], evaluate oral health promotion materials [<xref ref-type="bibr" rid="ref22">22</xref>], investigate the relationship between depression and stigma [<xref ref-type="bibr" rid="ref23">23</xref>], assess people&#8217;s reactions to frightening anti-smoking campaigns [<xref ref-type="bibr" rid="ref24">24</xref>], and evaluate public awareness of ovarian cancer [<xref ref-type="bibr" rid="ref25">25</xref>], among many other research-orientated applications [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. Amazon Mechanical Turk has its own vocabulary used by AMT workers (Turkers) and AMT task administrators (Requestors). A Human Intelligence Task (HIT) is a small job that may be performed in a matter of seconds or minutes and, once the work is approved by the requestor, may pay US $0.01-$0.25 or more per task depending on the complexity of the HIT. A group of HITs is called a &#8220;batch&#8221; and is made up of similar HITs. Depending on the complexity of the task and the payment offered by the Requestor, a batch is often completed within minutes or hours of posting.</p>
                <p>AMT is a reputation-based economy such that Turkers may only access the most desirable HITs once they have a sufficient track record of previously accepted work [<xref ref-type="bibr" rid="ref29">29</xref>]. High quality Turkers may avoid a new Requestor&#8217;s HITs until the Requestor has demonstrated his or her own fairness in approving and rejecting work. Indeed, a Turker&#8217;s reputation will suffer following rejection of even a small number of HITs. AMT is a complex ecosystem in which both high-quality work on the part of the Turkers and fairness on the part of the Requestor are rewarded.</p>
                <p>Turkers perform their work anonymously, but demographic studies have been conducted. In a survey of 1000 Turkers, Ipeirotis found that 46.8% of Turkers were located in the United States, 34% were in India, and the remaining 19.2% were from 64 other countries [<xref ref-type="bibr" rid="ref30">30</xref>]. The majority of workers in the United States were women, most of whom reported AMT as a source of supplemental income, whereas the majority of workers in India were men and reported AMT as their primary source of income. Across nations, Turkers were younger and better educated than the general population [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Screenshot of the Amazon Mechanical Turk Web interface for fundus photo grading.</p>
                    </caption>
                    <graphic xlink:href="jmir_v16i10e233_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Design</title>
                <p>For the current study, the United Kingdom national screening program grading scale [<xref ref-type="bibr" rid="ref31">31</xref>] was used by 2 attending retinal surgeons (OPG, CPS) to categorize 19 anonymized teaching images. The same AMT interface and resolution of images used by the Turkers was used by the expert graders. Consensus was reached by discussion on images for which there was disagreement. For the purposes of the study, terms from the UK grading scale were translated into plain language: &#8220;background&#8221; retinopathy was called &#8220;mild&#8221;, &#8220;preproliferative&#8221; was called &#8220;moderate&#8221;, and &#8220;proliferative&#8221; was called &#8220;severe&#8221;. &#8220;Maculopathy&#8221; was defined as abnormal on a training image with otherwise moderate disease but was not coded separately. The AMT interface was designed to provide training on grading of DR within each HIT. This training included 6 images annotated with the salient features of each level of retinopathy in plain language. Turkers were presented with the following text: &#8220;This is a photo of the inside of the eye. We are looking to label eyes as healthy or unhealthy with respect to diabetes. Rate this eye.&#8221; Turkers could hover their mouse over 6 adjacent training images (1 normal, 1 mild, 1 moderate, 3 severe) while reviewing the active test image. This layout allowed for all of the training and grading to occur in one browser window. More examples of proliferative/severe disease were provided due to the heterogeneity of findings constituting this level of disease. There were no restrictions on the type of device or display/monitor used by Turkers to complete the task.</p>
            </sec>
            <sec>
                <title>Phase I</title>
                <p>In the first phase of the study, the 19 images were posted to AMT for grading by Turkers, with 10 repetitions per photo for an initial proof-of-concept. Four photos were re-posted with this initial batch for 10 repetitions to assess intragrader reliability. Turkers were paid US $0.10 per image, and a 10% commission was paid to Amazon. In order to be eligible to view and complete the HITs, Turkers needed to have successfully completed 100 prior HITs and have an overall HIT approval rate of 97%.</p>
                <p>In the initial batch, HITs were posted asking Turkers to grade images as normal (0) versus abnormal (1). In subsequent batches, Turkers were asked to grade the same 19 images using three categories (normal=0, mild to moderate=1, and severe=2) and then four categories (normal=0, mild=1, moderate=2, and severe=3). Percentage of images correctly classified was calculated. Sensitivity and specificity were calculated for all batches, collapsing all abnormal categories together for three- and four-category grading tasks using Stata 13. A worker consensus grade was assigned to each image based on the mode of the 10 Turker scores. Consensus grade using the mean of the 10 Turker scores was also calculated on an exploratory basis. For the two-category tasks, a mean score &#60;0.5 was defined as normal, and &#8805;0.5 was abnormal. For the three-category tasks, &#60;0.5 was defined as normal, &#8805;0.5 to &#60;1.5 was defined as mild to moderate, and &#8805;1.5 was defined as severe. In the four-category tasks, &#60;0.5 was defined as normal, &#8805;0.5 to &#60;1.5 was defined as mild, &#8805;1.5 to &#60;2.5 was defined as moderate, and &#8805;2.5 was defined as severe.</p>
            </sec>
            <sec>
                <title>Phase II</title>
                <p>The purpose of Phase II was two-fold. First, Phase II sought to evaluate the emergent ability of the crowd to accurately distinguish between different levels of retinopathy, based on the idea that larger numbers of raters would increasingly coalesce around the correct answer. Second, Phase II sought to identify and ultimately confirm the threshold beyond which the contribution of one more rater would cease to provide additional information. To accomplish this, one prototypical image from each of the four grading categories was submitted to undergo 500 unique Turker interpretations. Jackknife resampling methods were then used to draw random subsamples from this &#8220;population&#8221; of 500 Turkers, beginning with 50 random samples of 2 Turkers, then 50 random samples of 3 Turkers, and so forth [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. This made it possible to estimate the variance in accuracy derived from each randomly drawn sample of raters at each crowd size and to compute area under the curve (AUC) of the receiver-operator characteristic (ROC) curve, indicating their performance relative to the expert grading.</p>
            </sec>
            <sec>
                <title>Phase III</title>
                <p>In Phase III of the study, three additional iterative batches of the 19 images were run in an effort to improve Turker grading using the four diagnostic categories. The first batch used Turker feedback from all previous batches to modify the training image set. The second batch used more stringent criteria for Turkers in addition to the modified training images. A minimum of 500 completed and approved HITs was required as was an overall HIT approval rate of 99%. The third batch was conducted using Turkers holding an Amazon designation of &#8220;Photo Moderation Master&#8221; and raised the compensation to US $0.15 per image, in addition to the changes made for batches 1 and 2. The criteria necessary to achieve this designation are not published, but Masters are &#8220;elite groups of Workers who have demonstrated accuracy on specific types of HITs on the Mechanical Turk marketplace. Workers achieve a Masters distinction by consistently completing HITs of a certain type with a high degree of accuracy across a variety of Requesters&#8221; [<xref ref-type="bibr" rid="ref33">33</xref>]. As in Phase I, percent correctly classified, worker consensus score, and average time to complete the HITs were estimated for these three iterative batches.</p>
                <p>The Wills Eye Institute Institutional Review Board ruled that approval was not required for this study.</p>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Phase I</title>
                <p>Two expert graders (OPG, CPS) coded 12 images as abnormal and 7 as normal (<xref ref-type="table" rid="table1">Table 1</xref>). Each of the three Phase I batches consisted of 23 photos (19 unique, 4 duplicates) with 10 unique graders for a total of 230 grading instances. Time-to-complete Turker grading of images varied with the number of grading categories. Two-category (normal/abnormal) grading was completed in 20 minutes, three-category grading in 3 hours, and four-category grading in 2 hours. Because the images were interpreted rapidly and workers could complete as many or as few of the HITs as desired, most of the four duplicate images were rated by unique Turkers, and therefore we were unable to assess intragrader reliability.</p>
                <p>Across 230 grading instances of unique images in the two-category HITs (normal vs. abnormal) of Phase I, 187 (81.3%) of the images were correctly classified by Turkers (<xref ref-type="table" rid="table1">Table 1</xref>). Sensitivity and specificity were 93.6% and 67.8% respectively using individual Turker scores. Sensitivity and specificity were 100% and 71.4% respectively using Turker consensus scores. Average time to grade each image was 25 seconds, including time to review training images. At US $0.11 per grading, each image was graded for $1.10, and grading garnered an effective hourly wage of $14.31 (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
                <p>Overall number of correctly classified images decreased with the addition of a third and fourth grading category to 64.4% (148/230) and 50.9% (117/230), respectively. Sensitivity and specificity for individual Turkers were 96.3% and 66.7%, respectively, for both three and four categories. At the level of Turker consensus, sensitivity was 100% for both three and four categories, and specificity was 71.4% and 100% for three and four categories, respectively. With additional grading criteria, the speed of grading decreased, as did the effective hourly wage. Average time to complete the three-category HITs was 51 seconds, for an effective hourly wage of $7.08. Average time to complete the four-category HITs was 55 seconds, for an effective hourly wage of $6.60 (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
                <table-wrap position="float" id="table1">
                    <label>Table 1</label>
                    <caption>
                        <p>Turker grading of individual images<sup>a</sup>.</p>
                    </caption>
                    <table width="1000" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="75" />
                        <col width="40" />
                        <col width="60" />
                        <col width="60" />
                        <col width="40" />
                        <col width="60" />
                        <col width="60" />
                        <col width="40" />
                        <col width="60" />
                        <col width="60" />
                        <thead>
                            <tr valign="top">
                                <td>Image #</td>
                                <td colspan="3">Two-category rating</td>
                                <td colspan="3">Three-category rating</td>
                                <td colspan="3">Four-category rating</td>
                            </tr>
                            <tr valign="bottom">
                                <td>
                                    <break />
                                </td>
                                <td>Expert <break /> rating</td>
                                <td>Correct <break /> diagnosis<sup>b</sup>, %</td>
                                <td>Turker <break /> consensus<sup>c</sup>
                                </td>
                                <td>Expert <break /> rating</td>
                                <td>Correct <break /> diagnosis<sup>b</sup>, %</td>
                                <td>Turker <break /> consensus<sup>c</sup>
                                </td>
                                <td>Expert <break /> rating</td>
                                <td>Correct <break /> diagnosis<sup>b</sup>, %</td>
                                <td>Turker <break /> consensus<sup>c</sup>
                                </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>1</td>
                                <td>Nor</td>
                                <td>65</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>55</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>2</td>
                                <td>Ab</td>
                                <td>85</td>
                                <td>&#8212;</td>
                                <td>M/M</td>
                                <td>50</td>
                                <td>Sev</td>
                                <td>Mild</td>
                                <td>0</td>
                                <td>Sev</td>
                            </tr>
                            <tr valign="top">
                                <td>3</td>
                                <td>Nor</td>
                                <td>70</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>70</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>70</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>4</td>
                                <td>Nor</td>
                                <td>50</td>
                                <td>Ab</td>
                                <td>Nor</td>
                                <td>40</td>
                                <td>M/M</td>
                                <td>Nor</td>
                                <td>60</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>5</td>
                                <td>Nor</td>
                                <td>80</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>70</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>50</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>6</td>
                                <td>Ab</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>M/M</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>Mild</td>
                                <td>20</td>
                                <td>Mod</td>
                            </tr>
                            <tr valign="top">
                                <td>7</td>
                                <td>Ab</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>60</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>10</td>
                                <td>Mod</td>
                            </tr>
                            <tr valign="top">
                                <td>8</td>
                                <td>Nor</td>
                                <td>50</td>
                                <td>Ab</td>
                                <td>Nor</td>
                                <td>40</td>
                                <td>M/M</td>
                                <td>Nor</td>
                                <td>65</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>9</td>
                                <td>Ab</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>95</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>100</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>10</td>
                                <td>Ab</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>40</td>
                                <td>M/M</td>
                                <td>Sev</td>
                                <td>70</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>11</td>
                                <td>Ab</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>0</td>
                                <td>M/M</td>
                                <td>Sev</td>
                                <td>20</td>
                                <td>Mild</td>
                            </tr>
                            <tr valign="top">
                                <td>12</td>
                                <td>Nor</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>80</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>90</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>13</td>
                                <td>Ab</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>M/M</td>
                                <td>30</td>
                                <td>Sev</td>
                                <td>Mod</td>
                                <td>20</td>
                                <td>Sev</td>
                            </tr>
                            <tr valign="top">
                                <td>14</td>
                                <td>Ab</td>
                                <td>80</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>40</td>
                                <td>M/M</td>
                                <td>Sev</td>
                                <td>10</td>
                                <td>Mod</td>
                            </tr>
                            <tr valign="top">
                                <td>15</td>
                                <td>Nor</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>Nor</td>
                                <td>90</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>16</td>
                                <td>Ab</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>70</td>
                                <td>&#8212;</td>
                                <td>Sev</td>
                                <td>50</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>17</td>
                                <td>Ab</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>M/M</td>
                                <td>60</td>
                                <td>&#8212;</td>
                                <td>Mild</td>
                                <td>10</td>
                                <td>Mod</td>
                            </tr>
                            <tr valign="top">
                                <td>18</td>
                                <td>Ab</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>M/M</td>
                                <td>100</td>
                                <td>&#8212;</td>
                                <td>Mod</td>
                                <td>95</td>
                                <td>&#8212;</td>
                            </tr>
                            <tr valign="top">
                                <td>19</td>
                                <td>Ab</td>
                                <td>90</td>
                                <td>&#8212;</td>
                                <td>M/M</td>
                                <td>80</td>
                                <td>&#8212;</td>
                                <td>Mild</td>
                                <td>20</td>
                                <td>Mod</td>
                            </tr>
                            <tr valign="top">
                                <td>Correct, %</td>
                                <td>&#160;</td>
                                <td>81.3</td>
                                <td>89.5</td>
                                <td>
                                    <break />
                                </td>
                                <td>64.4</td>
                                <td>63.2</td>
                                <td>&#160;</td>
                                <td>50.9</td>
                                <td>57.9</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Sensitivity<sup>d</sup>, %</td>
                                <td>&#160;</td>
                                <td>93.6</td>
                                <td>100.0</td>
                                <td>
                                    <break />
                                </td>
                                <td>96.3</td>
                                <td>100.0</td>
                                <td>&#160;</td>
                                <td>96.3</td>
                                <td>100.0</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Specificity<sup>d</sup>, %</td>
                                <td>&#160;</td>
                                <td>67.8</td>
                                <td>71.4</td>
                                <td>&#160;</td>
                                <td>66.7</td>
                                <td>71.4</td>
                                <td>&#160;</td>
                                <td>66.7</td>
                                <td>100.0</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table1fn1">
                            <p>
                                <sup>a</sup>Nor=Normal; Ab=Abnormal; M/M=Mild or Moderate; Sev=Severe; Mod=Moderate.</p>
                        </fn>
                        <fn id="table1fn2">
                            <p>
                                <sup>b</sup>At the level of the individual graders.</p>
                        </fn>
                        <fn id="table1fn3">
                            <p>
                                <sup>c</sup>Consensus rating presented only if it differed from the expert rating.</p>
                        </fn>
                        <fn id="table1fn4">
                            <p>
                                <sup>d</sup>Calculated for normal versus any disease level.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
                <table-wrap position="float" id="table2">
                    <label>Table 2</label>
                    <caption>
                        <p>Time to complete ratings (in seconds).</p>
                    </caption>
                    <table width="1000" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="107" />
                        <col width="62" />
                        <col width="68" />
                        <col width="62" />
                        <col width="94" />
                        <col width="96" />
                        <col width="89" />
                        <thead>
                            <tr valign="bottom">
                                <td>&#160;</td>
                                <td>Two-category rating</td>
                                <td>Three-category rating</td>
                                <td>Four-category rating</td>
                                <td>Four-category rating (improved training)</td>
                                <td>Four-category rating (increased approval)</td>
                                <td>Four-category rating (Master Graders)<sup>a</sup>
                                </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Mean time per HIT</td>
                                <td>25.16</td>
                                <td>50.87</td>
                                <td>54.52</td>
                                <td>50.98</td>
                                <td>38.79</td>
                                <td>44.14</td>
                            </tr>
                            <tr valign="top">
                                <td>95% CI</td>
                                <td>21.93-28.38</td>
                                <td>43.18-58.55</td>
                                <td>46.15-62.88</td>
                                <td>39.66-62.30</td>
                                <td>31.65-45.93</td>
                                <td>36.00-52.27</td>
                            </tr>
                            <tr valign="top">
                                <td>Hourly wage, $</td>
                                <td>14.31</td>
                                <td>7.08</td>
                                <td>6.60</td>
                                <td>7.06</td>
                                <td>9.28</td>
                                <td>12.23</td>
                            </tr>
                            <tr valign="top">
                                <td>Cost per image, $</td>
                                <td>1.10</td>
                                <td>1.10</td>
                                <td>1.10</td>
                                <td>1.10</td>
                                <td>1.10</td>
                                <td>1.95</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table2fn1">
                            <p>
                                <sup>a</sup>Master graders received US $0.15 per image, plus a 30% Amazon commission for a total cost of US $0.195/image.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Phase II</title>
                <p>Results of Phase II likewise indicate that sensitivity and specificity for overall ratings of abnormal versus normal were excellent, producing a highly significant AUC (0.98; <xref ref-type="fig" rid="figure2">Figure 2</xref>, Panel D). Turkers were not as accurate when asked to differentiate among four severity levels. Post hoc contrast analyses, however, indicate that Turkers performed well when asked to identify the abnormalities that were moderate in severity (AUC=0.85; <xref ref-type="fig" rid="figure2">Figure 2</xref>, Panel B). The pattern of results indicates that lower accuracy identifying mild (AUC=0.57; <xref ref-type="fig" rid="figure2">Figure 2</xref>, Panel A) and severe (AUC=0.73; <xref ref-type="fig" rid="figure2">Figure 2</xref>, Panel C) abnormalities was due to a tendency to rate all abnormalities as moderate in severity, rather than a failure to recognize normal versus mild and severe abnormalities more generally. Results also indicate that maximum AUC was usually achieved when crowd size reached a total of between 7 and 10 Turkers, confirming the validity of the crowd sizes used to rate the larger set of images (<xref ref-type="fig" rid="figure2">Figure 2</xref>). This affirms that the results of Phases I and III would not have been different had we sought a larger number of Turkers for each HIT.</p>
                <fig id="figure2" position="float">
                    <label>Figure 2</label>
                    <caption>
                        <p>Area under the curve (AUC) of the receiver-operator characteristic (ROC) curve for increasing numbers of Turker interpretations of a prototypical image from each severity level. Turkers had low accuracy for the Mild (Panel A) and Severe image (Panel C), but acceptable accuracy for the Moderate image (Panel B). When all four images were analyzed for absence or presence of disease only, Turkers performed well (Panel D) with a highly significant AUC.</p>
                    </caption>
                    <graphic xlink:href="jmir_v16i10e233_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Phase III</title>
                <p>In Phase III, an additional normal training image was added due to Turkers&#8217; interpreting visible choroidal vessels as abnormal during Phase I. The annotations were clarified to indicate that the presence of a single microaneurysm is considered abnormal and that hard exudates need not be present to achieve moderate or severe disease. Functionality to enlarge the image being graded was added. In the first batch using the new training, the percentage of correctly classified images using the consensus Turker scores was no better than previous: 42.1% (8/19 images) versus 57.9% (11/19 images), respectively by mode and 21.1% (4/19 images) versus 26.3% (5/19 images) by mean. In the second batch, with more stringent criteria for Turker selection, the proportion of correctly graded images improved to 52.6% (10/19 images) by mean (mode unchanged). This result was confirmed in a repeat run of this exact batch (data not shown). In the third batch, using &#8220;Photo Moderation Masters&#8221;, the proportion of correctly graded images decreased to 36.8% (7/19 images) by mean (mode unchanged). Throughout all batches, the diagnostic sensitivity for any level of disease was maintained at 100% (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>Turker consensus in Phase III.</p>
                    </caption>
                    <table width="680" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="213" />
                        <col width="90" />
                        <col width="52" />
                        <col width="52" />
                        <col width="52" />
                        <col width="62" />
                        <col width="62" />
                        <thead>
                            <tr valign="bottom">
                                <td>&#160;</td>
                                <td>Number correct (mean)<sup>a</sup>
                                </td>
                                <td>% correct (mean)</td>
                                <td>Number correct (mode)<sup>a</sup>
                                </td>
                                <td>% correct (mode)</td>
                                <td>Sensitivity<sup>b</sup>
                                </td>
                                <td>Specificity<sup>b</sup>
                                </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Phase I: Four-category rating</td>
                                <td>5</td>
                                <td>26.3</td>
                                <td>11</td>
                                <td>57.9</td>
                                <td>100.0</td>
                                <td>100.0</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Phase III: Trial 1 (improved training)</td>
                                <td>4</td>
                                <td>21.1<sup>c</sup>
                                </td>
                                <td>8<sup>d</sup>
                                </td>
                                <td>42.1</td>
                                <td>100.0</td>
                                <td>57.1</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Phase III: Trial 2 (raised approval rating)</td>
                                <td>10</td>
                                <td>52.6</td>
                                <td>11<sup>e</sup>
                                </td>
                                <td>57.9</td>
                                <td>100.0</td>
                                <td>100.0</td>
                            </tr>
                            <tr valign="top">
                                <td>Phase III: Trial 3 (Master Graders)</td>
                                <td>7</td>
                                <td>36.8</td>
                                <td>11</td>
                                <td>57.9</td>
                                <td>100.0</td>
                                <td>100.0</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table3fn1">
                            <p>
                                <sup>a</sup>Calculated by level (eg, Turker consensus matches expert designation as normal, mild, moderate, and severe).</p>
                        </fn>
                        <fn id="table3fn2">
                            <p>
                                <sup>b</sup>Calculated for normal versus any disease level using the mode consensus score.</p>
                        </fn>
                        <fn id="table3fn3">
                            <p>
                                <sup>c</sup>After excluding a single Turker with systematically higher scores, 42.1% correct.</p>
                        </fn>
                        <fn id="table3fn4">
                            <p>
                                <sup>d</sup>Three images had no mode and were considered incorrect for &#8220;Number Correct&#8221; and &#8220;% correct&#8221; but recoded as abnormal for sensitivity and specificity.</p>
                        </fn>
                        <fn id="table3fn5">
                            <p>
                                <sup>e</sup>One image had no mode and was considered incorrect for &#8220;Number Correct&#8221; and &#8220;% correct&#8221; but recoded as abnormal for sensitivity and specificity.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Principal Findings</title>
                <p>With minimal training, an anonymous, untrained workforce recruited through a public crowdsourcing platform can rapidly and correctly categorize fundus photos of diabetic patients as normal or abnormal. The Turkers in this study graded these images with a high sensitivity, which is ideal for a screening instrument. Critically, no false negative consensus results were generated in any of our batches, indicating that no cases of DR were missed. When asked to categorize photos by degree of retinopathy, Turkers improved with changes in the Turk interface, particularly with increasing prior approval rating needed to perform the HITs. The number of graders required to reach a reliable &#8220;consensus grade&#8221; was consistent across categories, and 10 grading instances per image was established as sufficient for valid results.</p>
                <p>Images were interpreted for a total cost of US $1.10 per eye. While abnormal images would currently still require further evaluation to identify patients in need of a live examination, this cost is near the limit suggested by some investigators for feasible public health screening in developing economies [<xref ref-type="bibr" rid="ref34">34</xref>]. Indeed, the reimbursement per image, which ranged from an effective hourly wage of US $6.60 to $14.31 in our study, could possibly be reduced, since a reasonable target hourly wage for AMT workers is the federal minimum wage of US $7.25 per hour or even lower [<xref ref-type="bibr" rid="ref35">35</xref>]. Additionally, posting larger batches of images might allow for lower per image reimbursement, since Turker speed would likely increase after becoming more skilled at the task, allowing them to maintain the same effective wage. While there may not be a direct relationship between quality responses and high wages [<xref ref-type="bibr" rid="ref36">36</xref>], there may be a link between high wages and rapid completion of image grading, so it may not be wise to dramatically reduce reimbursement.</p>
                <p>A post hoc analysis of individual Turkers&#8217; scores revealed inconsistent use of the four grading categories by one Turker in the first batch of Phase III (<xref ref-type="table" rid="table3">Table 3</xref>). Several issues are brought to light by considering this specific batch. First, inconsistent use of all categories was a rare occurrence, demonstrating that Turkers are conscientious workers. This was also evident from comments made by Turkers as they completed HITs, which included thoughtful suggestions for improvement to the interface and concern over HITs that were felt to be ambiguous. Second, using the mean of crowdsourced responses may generate outputs that are rather sensitive to outliers. For this reason, using the mode to calculate consensus is generally preferable, though some images may not have a pure mode (<xref ref-type="table" rid="table3">Table 3</xref>), in which case the higher score of any &#8220;tie&#8221; would be used clinically. Third, and more broadly, AMT may be susceptible to Turker accounts that attempt to take advantage of the system by rapidly completing HITs with random responses either with live individuals or with automated programs or &#8220;bots&#8221; [<xref ref-type="bibr" rid="ref29">29</xref>]. Moving forward, it may be necessary to analyze raw Turker scores for such phenomena and perhaps develop methods to exclude systematically unreliable scores.</p>
                <p>Since AMT is a reputation-based economy, Requestors can reject or block Turkers who are not performing appropriately. Both actions negatively impact the Turkers&#8217; reputation, which in turn affects their ability to perform HITs in the future, so there is a strong incentive to perform tasks accurately and honestly. This is likely why increasing the prior HIT approval rating to 99% had the most dramatic impact on consensus accuracy. Adding the &#8220;Photo Moderation Master&#8221; qualification did not improve worker consensus. This may be due to the fact that the criteria Amazon uses to grant this qualification are not relevant to our task. Additionally, since only a fraction of Turkers have the qualification, requiring it reduces the available workforce, which can increase the time required to complete batches. Especially when factoring in the additional Amazon commission, use of the Master qualification may not be necessary or cost-effective for these types of tasks in the future.</p>
                <p>The current study was limited to a small set of hand-picked, high-quality, mydriatic fundus photos chosen to illustrate the key findings in diabetic retinopathy. Screening populations might have a subset of low-quality or uninterpretable images and would also be expected to have far more images of normal fundi. Identifying pathology in such sets would require extra vigilance on the part of Turkers to detect mild disease within large groups of normal photos. Larger datasets with more subtle pathology need to be tested with this methodology. Additionally, analyzing whether iterative improvements to the interface lead to better results is confounded by the fact that Turkers may have previously been exposed to the task and may be improving in their grading through practice. This is unlikely because the Turkers receive no feedback on their grading, so they do not know if they have correctly graded images or not. Moreover, while it is not currently feasible to &#8220;block&#8221; Turkers who have previously completed any of our HITs, it is possible to view their grading history within the project. Surprisingly, throughout all batches posted, most of our HITs were completed by Turkers otherwise na&#239;ve to our project. In the final batch of 190 HITs posted for this project, after approximately 3000 HITs using the same images had been posted, 170 (89.5%) were completed by Turkers who had never done any of our HITs before, and 20 HITs were done by 3 individual Turkers who had each graded only four images previously (data not shown). In future larger batches, adjusting for individual graders&#8217; improvement over time could become necessary.</p>
            </sec>
            <sec>
                <title>Future Considerations</title>
                <p>While further refinement of the methodology is still needed to resolve the degree of retinopathy, the current model could possibly be used as a way to reduce the burden on skilled graders by eliminating most of the normal images in very large screenings and passing only those abnormal images on for further characterization. While the individuals who complete HITs on AMT are truly anonymous, they do have unique numerical identifiers and can be tracked across HITs and batches of HITs. Therefore, an intriguing possibility using a crowdsourcing interface could include developing a cadre of specific Turkers who demonstrate a track record of reliable grading. These graders might be capable of a higher level of categorization than the general pool of Turkers and could be recruited for more complex grading tasks. Additionally, it is likely that automated computer algorithms will also play a role in the analysis of fundus images for DR and other conditions in the future. This raises the possibility of an even more robust interaction between artificial intelligence and human intelligence. Images could be graded in a tiered fashion by one system, and then those graded ambiguously could be routed to the other for further validation.</p>
                <p>An unanticipated benefit of such a crowdsourcing program is that it might raise awareness of diabetes and diabetic retinopathy. Since our interface allowed Turkers to leave feedback for us to refine the instrument, we were able to capture comments such as, &#8220;I have learn about diabetes little bit [sic]&#8221;, &#8220;I really liked seeing the pics of the eye, very interesting&#8221;, and &#8220;This HIT was very good and a nice break from all of the bubbling surveys. Thank you!&#8221;, suggesting an interest in the subject matter beyond other HITs and beyond what we had expected at the outset. This finding is consistent with what has been termed &#8220;Virtual Citizen Science&#8221; in fields outside of biomedical research [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>Crowdsourcing represents a novel and inexpensive means to rapidly identify diabetic retinopathy. Further refinements of the technique are required, as is external validation with larger image sets. Additionally, multiple medico-legal and ethical issues would need to be addressed prior to clinical use of this technology, but there may be a role for crowdsourcing medical imaging data in large public health screenings and other settings in the future.</p>
            </sec>
        </sec>
    </body>
    <back>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">AMT</term>
                    <def>
                        <p>Amazon Mechanical Turk</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">AUC</term>
                    <def>
                        <p>area under the curve</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">DR</term>
                    <def>
                        <p>diabetic retinopathy</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">HIT</term>
                    <def>
                        <p>human intelligence task</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb5">ROC</term>
                    <def>
                        <p>receiver operating characteristic</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>This research was supported by the J. Arch McNamara, MD Memorial Fund for Retina Research and Education at Wills Eye Hospital. The sponsor had no role in the design, conduct, or decision to publish the research, nor did they have any role in the review or approval of the manuscript.</p>
            <p>This manuscript was presented at the American Society of Retina Specialists Annual Meeting, August 2014.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Beck</surname>
                            <given-names>RW</given-names>
                        </name>
                    </person-group>
                    <article-title>The burgeoning public health impact of diabetes: the role of the ophthalmologist</article-title>
                    <source>Arch Ophthalmol</source>
                    <year>2011</year>
                    <month>02</month>
                    <volume>129</volume>
                    <issue>2</issue>
                    <fpage>225</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="doi">10.1001/archophthalmol.2010.331</pub-id>
                    <pub-id pub-id-type="medline">21320972</pub-id>
                    <pub-id pub-id-type="pii">129/2/225</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Javitt</surname>
                            <given-names>JC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Canner</surname>
                            <given-names>JK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Frank</surname>
                            <given-names>RG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Steinwachs</surname>
                            <given-names>DM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sommer</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Detecting and treating retinopathy in patients with type I diabetes mellitus. A health policy model</article-title>
                    <source>Ophthalmology</source>
                    <year>1990</year>
                    <month>04</month>
                    <volume>97</volume>
                    <issue>4</issue>
                    <fpage>483</fpage>
                    <lpage>94</lpage>
                    <comment>discussion 494</comment>
                    <pub-id pub-id-type="medline">2109299</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Javitt</surname>
                            <given-names>JC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Aiello</surname>
                            <given-names>LP</given-names>
                        </name>
                    </person-group>
                    <article-title>Cost-effectiveness of detecting and treating diabetic retinopathy</article-title>
                    <source>Ann Intern Med</source>
                    <year>1996</year>
                    <month>01</month>
                    <day>1</day>
                    <volume>124</volume>
                    <issue>1 Pt 2</issue>
                    <fpage>164</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="medline">8554212</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Jones</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Edwards</surname>
                            <given-names>RT</given-names>
                        </name>
                    </person-group>
                    <article-title>Diabetic retinopathy screening: a systematic review of the economic evidence</article-title>
                    <source>Diabet Med</source>
                    <year>2010</year>
                    <month>03</month>
                    <volume>27</volume>
                    <issue>3</issue>
                    <fpage>249</fpage>
                    <lpage>56</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1464-5491.2009.02870.x</pub-id>
                    <pub-id pub-id-type="medline">20536486</pub-id>
                    <pub-id pub-id-type="pii">DME2870</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Schoenfeld</surname>
                            <given-names>ER</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Greene</surname>
                            <given-names>JM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wu</surname>
                            <given-names>SY</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leske</surname>
                            <given-names>MC</given-names>
                        </name>
                    </person-group>
                    <article-title>Patterns of adherence to diabetes vision care guidelines: baseline findings from the Diabetic Retinopathy Awareness Program</article-title>
                    <source>Ophthalmology</source>
                    <year>2001</year>
                    <month>03</month>
                    <volume>108</volume>
                    <issue>3</issue>
                    <fpage>563</fpage>
                    <lpage>71</lpage>
                    <pub-id pub-id-type="medline">11237912</pub-id>
                    <pub-id pub-id-type="pii">S0161-6420(00)00600-X</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Paz</surname>
                            <given-names>SH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Varma</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Klein</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wu</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Azen</surname>
                            <given-names>SP</given-names>
                        </name>
                        <collab>Los Angeles Latino Eye Study Group</collab>
                    </person-group>
                    <article-title>Noncompliance with vision care guidelines in Latinos with type 2 diabetes mellitus: the Los Angeles Latino Eye Study</article-title>
                    <source>Ophthalmology</source>
                    <year>2006</year>
                    <month>08</month>
                    <volume>113</volume>
                    <issue>8</issue>
                    <fpage>1372</fpage>
                    <lpage>7</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ophtha.2006.04.018</pub-id>
                    <pub-id pub-id-type="medline">16769120</pub-id>
                    <pub-id pub-id-type="pii">S0161-6420(06)00566-5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lee</surname>
                            <given-names>PP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Feldman</surname>
                            <given-names>ZW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ostermann</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>DS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sloan</surname>
                            <given-names>FA</given-names>
                        </name>
                    </person-group>
                    <article-title>Longitudinal rates of annual eye examinations of persons with diabetes and chronic eye diseases</article-title>
                    <source>Ophthalmology</source>
                    <year>2003</year>
                    <month>10</month>
                    <volume>110</volume>
                    <issue>10</issue>
                    <fpage>1952</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="doi">10.1016/S0161-6420(03)00817-0</pub-id>
                    <pub-id pub-id-type="medline">14522771</pub-id>
                    <pub-id pub-id-type="pii">S0161-6420(03)00817-0</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fong</surname>
                            <given-names>DS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sharza</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Paschal</surname>
                            <given-names>JF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ariyasu</surname>
                            <given-names>RG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lee</surname>
                            <given-names>PP</given-names>
                        </name>
                    </person-group>
                    <article-title>Vision loss among diabetics in a group model Health Maintenance Organization (HMO)</article-title>
                    <source>Am J Ophthalmol</source>
                    <year>2002</year>
                    <month>02</month>
                    <volume>133</volume>
                    <issue>2</issue>
                    <fpage>236</fpage>
                    <lpage>41</lpage>
                    <pub-id pub-id-type="medline">11812428</pub-id>
                    <pub-id pub-id-type="pii">S0002939401013642</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Sharp</surname>
                            <given-names>PF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Olson</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Strachan</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hipwell</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ludbrook</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>O'Donnell</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wallace</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goatman</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Grant</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Waugh</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McHardy</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Forrester</surname>
                            <given-names>JV</given-names>
                        </name>
                    </person-group>
                    <article-title>The value of digital imaging in diabetic retinopathy</article-title>
                    <source>Health Technol Assess</source>
                    <year>2003</year>
                    <volume>7</volume>
                    <issue>30</issue>
                    <fpage>1</fpage>
                    <lpage>119</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.journalslibrary.nihr.ac.uk/hta/volume-7/issue-30" />
                    </comment>
                    <pub-id pub-id-type="medline">14604499</pub-id>
                    <pub-id pub-id-type="pii">94-18-05</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Scanlon</surname>
                            <given-names>PH</given-names>
                        </name>
                    </person-group>
                    <article-title>The English national screening programme for sight-threatening diabetic retinopathy</article-title>
                    <source>J Med Screen</source>
                    <year>2008</year>
                    <volume>15</volume>
                    <issue>1</issue>
                    <fpage>1</fpage>
                    <lpage>4</lpage>
                    <pub-id pub-id-type="doi">10.1258/jms.2008.008015</pub-id>
                    <pub-id pub-id-type="medline">18416946</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ng</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nathoo</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rudnisky</surname>
                            <given-names>CJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tennant</surname>
                            <given-names>MT</given-names>
                        </name>
                    </person-group>
                    <article-title>Improving access to eye care: teleophthalmology in Alberta, Canada</article-title>
                    <source>J Diabetes Sci Technol</source>
                    <year>2009</year>
                    <month>03</month>
                    <volume>3</volume>
                    <issue>2</issue>
                    <fpage>289</fpage>
                    <lpage>96</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20144360" />
                    </comment>
                    <pub-id pub-id-type="medline">20144360</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2771508</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Teng</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lefley</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Claremont</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Progress towards automated diabetic ocular screening: a review of image analysis and intelligent systems for diabetic retinopathy</article-title>
                    <source>Med Biol Eng Comput</source>
                    <year>2002</year>
                    <month>01</month>
                    <volume>40</volume>
                    <issue>1</issue>
                    <fpage>2</fpage>
                    <lpage>13</lpage>
                    <pub-id pub-id-type="medline">11954703</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Abr&#224;moff</surname>
                            <given-names>MD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Folk</surname>
                            <given-names>JC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Han</surname>
                            <given-names>DP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Walker</surname>
                            <given-names>JD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>DF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Russell</surname>
                            <given-names>SR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Massin</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cochener</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gain</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tang</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lamard</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Moga</surname>
                            <given-names>DC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Quellec</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Niemeijer</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Automated analysis of retinal images for detection of referable diabetic retinopathy</article-title>
                    <source>JAMA Ophthalmol</source>
                    <year>2013</year>
                    <month>03</month>
                    <volume>131</volume>
                    <issue>3</issue>
                    <fpage>351</fpage>
                    <lpage>7</lpage>
                    <pub-id pub-id-type="doi">10.1001/jamaophthalmol.2013.1743</pub-id>
                    <pub-id pub-id-type="medline">23494039</pub-id>
                    <pub-id pub-id-type="pii">1668203</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Trucco</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ruggeri</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Karnowski</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giancardo</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chaum</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hubschman</surname>
                            <given-names>JP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Al-Diri</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cheung</surname>
                            <given-names>CY</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wong</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Abr&#224;moff</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lim</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kumar</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Burlina</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bressler</surname>
                            <given-names>NM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jelinek</surname>
                            <given-names>HF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meriaudeau</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Quellec</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Macgillivray</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dhillon</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Validating retinal fundus image analysis algorithms: issues and a proposal</article-title>
                    <source>Invest Ophthalmol Vis Sci</source>
                    <year>2013</year>
                    <month>05</month>
                    <volume>54</volume>
                    <issue>5</issue>
                    <fpage>3546</fpage>
                    <lpage>59</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.iovs.org/cgi/pmidlookup?view=long&#38;pmid=23794433" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1167/iovs.12-10347</pub-id>
                    <pub-id pub-id-type="medline">23794433</pub-id>
                    <pub-id pub-id-type="pii">54/5/3546</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Brabham</surname>
                            <given-names>DC</given-names>
                        </name>
                    </person-group>
                    <source>Crowdsourcing. The MIT Press Essential Knowledge Series</source>
                    <year>2013</year>
                    <publisher-loc>Cambridge, MA</publisher-loc>
                    <publisher-name>MIT Press</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Brabham</surname>
                            <given-names>DC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ribisl</surname>
                            <given-names>KM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kirchner</surname>
                            <given-names>TR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bernhardt</surname>
                            <given-names>JM</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing applications for public health</article-title>
                    <source>Am J Prev Med</source>
                    <year>2014</year>
                    <month>02</month>
                    <volume>46</volume>
                    <issue>2</issue>
                    <fpage>179</fpage>
                    <lpage>87</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.amepre.2013.10.016</pub-id>
                    <pub-id pub-id-type="medline">24439353</pub-id>
                    <pub-id pub-id-type="pii">S0749-3797(13)00589-8</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Luengo-Oroz</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Arranz</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Frean</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing malaria parasite quantification: an online game for analyzing images of infected thick blood smears</article-title>
                    <source>J Med Internet Res</source>
                    <year>2012</year>
                    <volume>14</volume>
                    <issue>6</issue>
                    <fpage>e167</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/6/e167/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2338</pub-id>
                    <pub-id pub-id-type="medline">23196001</pub-id>
                    <pub-id pub-id-type="pii">v14i6e167</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3510720</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mitry</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Peto</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hayat</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Morgan</surname>
                            <given-names>JE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Khaw</surname>
                            <given-names>KT</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Foster</surname>
                            <given-names>PJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing as a novel technique for retinal fundus photography classification: analysis of images in the EPIC Norfolk cohort on behalf of the UK Biobank Eye and Vision Consortium</article-title>
                    <source>PLoS One</source>
                    <year>2013</year>
                    <volume>8</volume>
                    <issue>8</issue>
                    <fpage>e71154</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0071154" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0071154</pub-id>
                    <pub-id pub-id-type="medline">23990935</pub-id>
                    <pub-id pub-id-type="pii">PONE-D-13-23630</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3749186</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>HK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Horton</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bursell</surname>
                            <given-names>SE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cavallerano</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zimmer-Galler</surname>
                            <given-names>I</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tennant</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Abramoff</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chaum</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Debuc</surname>
                            <given-names>DC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leonard-Martin</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Winchester</surname>
                            <given-names>M</given-names>
                        </name>
                        <collab>American Telemedicine Association Diabetic Retinopathy Telehealth Practice Recommendations Working Group</collab>
                        <name name-style="western">
                            <surname>Lawrence</surname>
                            <given-names>MG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bauman</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gardner</surname>
                            <given-names>WK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hildebran</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Federman</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Telehealth practice recommendations for diabetic retinopathy, second edition</article-title>
                    <source>Telemed J E Health</source>
                    <year>2011</year>
                    <month>12</month>
                    <volume>17</volume>
                    <issue>10</issue>
                    <fpage>814</fpage>
                    <lpage>37</lpage>
                    <pub-id pub-id-type="doi">10.1089/tmj.2011.0075</pub-id>
                    <pub-id pub-id-type="medline">21970573</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="web">
                    <source>Amazon Mechanical Turk</source>
                    <access-date>2014-08-25</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.mturk.com/mturk/welcome">https://www.mturk.com/mturk/welcome</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6S5lYMqkr</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ilakkuvan</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tacelosky</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ivey</surname>
                            <given-names>KC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pearson</surname>
                            <given-names>JL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cantrell</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vallone</surname>
                            <given-names>DM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Abrams</surname>
                            <given-names>DB</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kirchner</surname>
                            <given-names>TR</given-names>
                        </name>
                    </person-group>
                    <article-title>Cameras for Public Health Surveillance: A Methods Protocol for Crowdsourced Annotation of Point-of-Sale Photographs</article-title>
                    <source>JMIR Res Protoc</source>
                    <year>2014</year>
                    <volume>3</volume>
                    <issue>2</issue>
                    <fpage>e22</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.researchprotocols.org/2014/2/e22/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/resprot.3277</pub-id>
                    <pub-id pub-id-type="medline">24717168</pub-id>
                    <pub-id pub-id-type="pii">v3i2e22</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4004156</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Turner</surname>
                            <given-names>AM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kirchhoff</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Capurro</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Using crowdsourcing technology for testing multilingual public health promotion materials</article-title>
                    <source>J Med Internet Res</source>
                    <year>2012</year>
                    <volume>14</volume>
                    <issue>3</issue>
                    <fpage>e79</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/3/e79/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2063</pub-id>
                    <pub-id pub-id-type="medline">22664384</pub-id>
                    <pub-id pub-id-type="pii">v14i3e79</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3414863</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Henshaw</surname>
                            <given-names>EJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Too sick, not sick enough? Effects of treatment type and timing on depression stigma</article-title>
                    <source>J Nerv Ment Dis</source>
                    <year>2014</year>
                    <month>04</month>
                    <volume>202</volume>
                    <issue>4</issue>
                    <fpage>292</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="doi">10.1097/NMD.0000000000000121</pub-id>
                    <pub-id pub-id-type="medline">24647215</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Halkjelsvik</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>Do disgusting and fearful anti-smoking advertisements increase or decrease support for tobacco control policies?</article-title>
                    <source>Int J Drug Policy</source>
                    <year>2014</year>
                    <month>07</month>
                    <volume>25</volume>
                    <issue>4</issue>
                    <fpage>744</fpage>
                    <lpage>7</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.drugpo.2014.01.021</pub-id>
                    <pub-id pub-id-type="medline">24630079</pub-id>
                    <pub-id pub-id-type="pii">S0955-3959(14)00024-3</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Carter</surname>
                            <given-names>RR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>DiFeo</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bogie</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>GQ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sun</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing awareness: exploration of the ovarian cancer knowledge gap through Amazon Mechanical Turk</article-title>
                    <source>PLoS One</source>
                    <year>2014</year>
                    <volume>9</volume>
                    <issue>1</issue>
                    <fpage>e85508</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0085508" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0085508</pub-id>
                    <pub-id pub-id-type="medline">24465580</pub-id>
                    <pub-id pub-id-type="pii">PONE-D-13-31754</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3899016</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Swan</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourced health research studies: an important emerging complement to clinical trials in the public health research ecosystem</article-title>
                    <source>J Med Internet Res</source>
                    <year>2012</year>
                    <volume>14</volume>
                    <issue>2</issue>
                    <fpage>e46</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/2/e46/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1988</pub-id>
                    <pub-id pub-id-type="medline">22397809</pub-id>
                    <pub-id pub-id-type="pii">v14i2e46</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3376509</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Good</surname>
                            <given-names>BM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Loguercio</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Griffith</surname>
                            <given-names>OL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nanis</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wu</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Su</surname>
                            <given-names>AI</given-names>
                        </name>
                    </person-group>
                    <article-title>The Cure: Design and Evaluation of a Crowdsourcing Game for Gene Selection for Breast Cancer Survival Prediction</article-title>
                    <source>JMIR Serious Games</source>
                    <year>2014</year>
                    <month>07</month>
                    <day>29</day>
                    <volume>2</volume>
                    <issue>2</issue>
                    <fpage>e7</fpage>
                    <pub-id pub-id-type="doi">10.2196/games.3350</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Dasgupta</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Freifeld</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brownstein</surname>
                            <given-names>JS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Menone</surname>
                            <given-names>CM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Surratt</surname>
                            <given-names>HL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Poppish</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Green</surname>
                            <given-names>JL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lavonas</surname>
                            <given-names>EJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dart</surname>
                            <given-names>RC</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing black market prices for prescription opioids</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>8</issue>
                    <fpage>e178</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/8/e178/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2810</pub-id>
                    <pub-id pub-id-type="medline">23956042</pub-id>
                    <pub-id pub-id-type="pii">v15i8e178</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3758048</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Martin</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hanrahan</surname>
                            <given-names>BV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>O'Neill</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Being a turker</article-title>
                    <source>Proceedings of the 17th ACM conference on Computer supported cooperative work &#38; social computing</source>
                    <year>2014</year>
                    <conf-name>17th ACM conference on Computer supported cooperative work &#38; social computing</conf-name>
                    <conf-date>February 15-19, 2014</conf-date>
                    <conf-loc>Baltimore, Maryland, USA</conf-loc>
                    <pub-id pub-id-type="doi">10.1145/2531602.2531663</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ipeirotis</surname>
                            <given-names>PG</given-names>
                        </name>
                    </person-group>
                    <source>CeDER Working Papers-10-01</source>
                    <year>2010</year>
                    <access-date>2014-09-26</access-date>
                    <comment>Demographics of Mechanical Turk <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://hdl.handle.net/2451/29585">http://hdl.handle.net/2451/29585</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6StCwI3A8</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Shotliff</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Duncan</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Diabetic retinopathy: summary of grading and management criteria</article-title>
                    <source>Pract Diab Int</source>
                    <year>2006</year>
                    <month>11</month>
                    <volume>23</volume>
                    <issue>9</issue>
                    <fpage>418</fpage>
                    <lpage>420</lpage>
                    <pub-id pub-id-type="doi">10.1002/pdi.1029</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Quenouille</surname>
                            <given-names>MH</given-names>
                        </name>
                    </person-group>
                    <article-title>Notes on bias in estimation</article-title>
                    <source>Biometrika</source>
                    <year>1956</year>
                    <volume>43</volume>
                    <issue>3-4</issue>
                    <fpage>353</fpage>
                    <lpage>360</lpage>
                    <pub-id pub-id-type="doi">10.1093/biomet/43.3-4.353</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="web">
                    <source>Amazon Mechanical Turk Frequently Asked Questions</source>
                    <access-date>2014-08-25</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://requester.mturk.com/help/faq">https://requester.mturk.com/help/faq</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6S5ljfanT</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Friedman</surname>
                            <given-names>DS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ali</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kourgialis</surname>
                            <given-names>N</given-names>
                        </name>
                    </person-group>
                    <article-title>Diabetic retinopathy in the developing world: how to approach identifying and treating underserved populations</article-title>
                    <source>Am J Ophthalmol</source>
                    <year>2011</year>
                    <month>02</month>
                    <volume>151</volume>
                    <issue>2</issue>
                    <fpage>192</fpage>
                    <lpage>194.e1</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ajo.2010.10.014</pub-id>
                    <pub-id pub-id-type="medline">21251492</pub-id>
                    <pub-id pub-id-type="pii">S0002-9394(10)00813-5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Horton</surname>
                            <given-names>JJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chilton</surname>
                            <given-names>LB</given-names>
                        </name>
                    </person-group>
                    <article-title>The labor economics of paid crowdsourcing</article-title>
                    <source>Proceedings of the 11th ACM conference on Electronic commerce</source>
                    <year>2010</year>
                    <conf-name>11th ACM conference on Electronic commerce</conf-name>
                    <conf-date>June 7-11, 2010</conf-date>
                    <conf-loc>Cambridge, Massachusetts, USA</conf-loc>
                    <pub-id pub-id-type="doi">10.1145/1807342.1807376</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mason</surname>
                            <given-names>W</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Watts</surname>
                            <given-names>DJ</given-names>
                        </name>
                    </person-group>
                    <article-title>Financial incentives and the "performance of crowds"</article-title>
                    <source>Proceedings of the ACM SIGKDD Workshop on Human Computation</source>
                    <year>2009</year>
                    <conf-name>2009 ACM SIGKDD Workshop on Human Computation</conf-name>
                    <conf-date>June 28-July 1, 2009</conf-date>
                    <conf-loc>Paris, France</conf-loc>
                    <pub-id pub-id-type="doi">10.1145/1600150.1600175</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Reed</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Raddick</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lardner</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>An exploratory factor analysis of motivations for participating in Zooniverse, a collection of virtual citizen science projects</article-title>
                    <source>46th Hawaii International Conference on System Sciences (HICSS)</source>
                    <year>2013</year>
                    <conf-name>46th Hawaii International Conference on System Sciences (HICSS)</conf-name>
                    <conf-date>January 7-10, 2013</conf-date>
                    <conf-loc>Wailea, Maui, HI</conf-loc>
                    <pub-id pub-id-type="doi">10.1109/HICSS.2013.85</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
