<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i10e21299</article-id>
      <article-id pub-id-type="pmid">33001828</article-id>
      <article-id pub-id-type="doi">10.2196/21299</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Diagnostic Accuracy of Web-Based COVID-19 Symptom Checkers: Comparison Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Rashid Soron</surname>
            <given-names>Tanjir </given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Judson</surname>
            <given-names>Timothy</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Bellei</surname>
            <given-names>Ericles</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Munsch</surname>
            <given-names>Nicolas</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3543-0548</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Martin</surname>
            <given-names>Alistair</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9735-2149</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Gruarin</surname>
            <given-names>Stefanie</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8700-9056</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Nateqi</surname>
            <given-names>Jama</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8194-2654</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Abdarahmane</surname>
            <given-names>Isselmou</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2341-5690</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Weingartner-Ortner</surname>
            <given-names>Rafael</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4786-0334</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Knapp</surname>
            <given-names>Bernhard</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Data Science Department</institution>
            <institution>Symptoma</institution>
            <addr-line>Landstraßer Gürtel 3</addr-line>
            <addr-line>Vienna, 1030</addr-line>
            <country>Austria</country>
            <phone>43 662458206</phone>
            <email>science@symptoma.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5714-7105</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Data Science Department</institution>
        <institution>Symptoma</institution>
        <addr-line>Vienna</addr-line>
        <country>Austria</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Medical Department</institution>
        <institution>Symptoma</institution>
        <addr-line>Attersee</addr-line>
        <country>Austria</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Internal Medicine</institution>
        <institution>Paracelsus Medical University</institution>
        <addr-line>Salzburg</addr-line>
        <country>Austria</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Bernhard Knapp <email>science@symptoma.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>10</issue>
      <elocation-id>e21299</elocation-id>
      <history>
        <date date-type="received">
          <day>15</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>7</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>27</day>
          <month>7</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>9</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Nicolas Munsch, Alistair Martin, Stefanie Gruarin, Jama Nateqi, Isselmou Abdarahmane, Rafael Weingartner-Ortner, Bernhard Knapp. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 06.10.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2020/10/e21299/" xlink:type="simple"/>
      <related-article related-article-type="commentary" id="v23i5e26148" ext-link-type="doi" xlink:href="10.2196/26148" vol="23" page="e26148" xlink:type="simple">https://www.jmir.org/2021/5/e26148</related-article>
      <related-article related-article-type="commentary" id="v23i5e26543" ext-link-type="doi" xlink:href="10.2196/26543" vol="23" page="e26543" xlink:type="simple">https://www.jmir.org/2021/5/e26543</related-article>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>A large number of web-based COVID-19 symptom checkers and chatbots have been developed; however, anecdotal evidence suggests that their conclusions are highly variable. To our knowledge, no study has evaluated the accuracy of COVID-19 symptom checkers in a statistically rigorous manner.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study is to evaluate and compare the diagnostic accuracies of web-based COVID-19 symptom checkers.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We identified 10 web-based COVID-19 symptom checkers, all of which were included in the study. We evaluated the COVID-19 symptom checkers by assessing 50 COVID-19 case reports alongside 410 non–COVID-19 control cases. A bootstrapping method was used to counter the unbalanced sample sizes and obtain confidence intervals (CIs). Results are reported as sensitivity, specificity, F1 score, and Matthews correlation coefficient (MCC).</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The classification task between COVID-19–positive and COVID-19–negative for “high risk” cases among the 460 test cases yielded (sorted by F1 score): Symptoma (F1=0.92, MCC=0.85), Infermedica (F1=0.80, MCC=0.61), US Centers for Disease Control and Prevention (CDC) (F1=0.71, MCC=0.30), Babylon (F1=0.70, MCC=0.29), Cleveland Clinic (F1=0.40, MCC=0.07), Providence (F1=0.40, MCC=0.05), Apple (F1=0.29, MCC=-0.10), Docyet (F1=0.27, MCC=0.29), Ada (F1=0.24, MCC=0.27) and Your.MD (F1=0.24, MCC=0.27). For “high risk” and “medium risk” combined the performance was: Symptoma (F1=0.91, MCC=0.83) Infermedica (F1=0.80, MCC=0.61), Cleveland Clinic (F1=0.76, MCC=0.47), Providence (F1=0.75, MCC=0.45), Your.MD (F1=0.72, MCC=0.33), CDC (F1=0.71, MCC=0.30), Babylon (F1=0.70, MCC=0.29), Apple (F1=0.70, MCC=0.25), Ada (F1=0.42, MCC=0.03), and Docyet (F1=0.27, MCC=0.29).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We found that the number of correctly assessed COVID-19 and control cases varies considerably between symptom checkers, with different symptom checkers showing different strengths with respect to sensitivity and specificity. A good balance between sensitivity and specificity was only achieved by two symptom checkers.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>COVID-19</kwd>
        <kwd>symptom checkers</kwd>
        <kwd>benchmark</kwd>
        <kwd>digital health</kwd>
        <kwd>symptom</kwd>
        <kwd>chatbot</kwd>
        <kwd>accuracy</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>In the modern world, large numbers of patients initially turn to various web-based sources for self-diagnoses of health concerns before seeking diagnoses from a trained medical professional. However, web-based sources have inherent problems, such as misinformation, misunderstandings, misleading advertisements, and varying quality [<xref ref-type="bibr" rid="ref1">1</xref>]. Interactive web sources developed to provide web-based diagnoses are sometimes referred to as symptom checkers or chatbots [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Based on a list of entered symptoms and other factors, these symptom checkers return a list of potential diseases.</p>
      <p>Web-based symptom checkers have become popular in the context of the novel COVID-19 pandemic, as access to physicians is reduced, concern in the population is high, and large amounts of misinformation are circulating the internet [<xref ref-type="bibr" rid="ref1">1</xref>]. On COVID-19 symptom checker web pages, users are asked a series of COVID-19–specific questions; upon completion, an association between the answers and COVID-19 is given alongside behavioral recommendations, such as self-isolation.</p>
      <p>In this context, COVID-19 symptom checkers are valuable tools for preassessment and screening during this pandemic; they can both ease pressure on clinicians and decrease footfall within hospitals. One example is practicing social distancing by not going to a physician’s waiting room when feeling sick. The importance of social distancing has been highlighted in the COVID-19 pandemic [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>], the 2009 H1N1 influenza pandemic [<xref ref-type="bibr" rid="ref6">6</xref>], and the 1918-1919 influenza pandemic [<xref ref-type="bibr" rid="ref7">7</xref>] and is reviewed in [<xref ref-type="bibr" rid="ref8">8</xref>]. Symptom checkers can also ease pressure on medical telephone hotlines [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>] by reducing the number of human phone operators needed.</p>
      <p>A large number of symptom checkers specific to COVID-19 have been developed. Empirical evidence (eg, a newspaper article [<xref ref-type="bibr" rid="ref11">11</xref>]) suggests that their conclusions differ, with possible implications for the quality of the symptom assessment. To our knowledge, there are no studies comparing and evaluating COVID-19 symptom checkers.</p>
      <p>In this paper, we present a study evaluating 10 different web-based COVID-19 symptom checkers using 50 COVID-19 cases extracted from the literature and 410 non–COVID-19 control cases of patients with other diseases. We found that the classifications of many patient cases by the COVID-19 symptom checkers differ. Therefore the accuracies of symptom checkers also differ.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>COVID-19 Symptom Checkers</title>
        <p>In April 2020, we conducted a Google search for COVID-19 symptom checkers using the search terms <italic>COVID-19 symptom checker</italic> and <italic>Corona symptom checker</italic>. All ten COVID-19 symptom checkers that we found and that were freely available on the internet between April 3 and 9, 2020, were included in this study (<xref ref-type="table" rid="table1">Table 1</xref>). Nine checkers were implemented in the English language, while one was in German. These symptom checkers were used in the versions available in this date range, and updates after this date were not considered for analysis.</p>
        <p>As a baseline for the performance evaluation of the 10 web-based COVID-19 symptom checkers, we developed two additional simplistic symptom checkers. These two checkers evaluate and weigh the presence of COVID-19 symptom frequencies provided by the World Health Organization (WHO) [<xref ref-type="bibr" rid="ref12">12</xref>] (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) based on vector distance (SF-DIST) and cosine similarity (SF-COS). These approaches can be implemented in a few lines of code (see <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>List of web-based COVID-19 symptom checkers included in this study.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Name</td>
                <td>Reference</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Ada</td>
                <td>[<xref ref-type="bibr" rid="ref13">13</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Apple</td>
                <td>[<xref ref-type="bibr" rid="ref14">14</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Babylon</td>
                <td>[<xref ref-type="bibr" rid="ref15">15</xref>]</td>
              </tr>
              <tr valign="top">
                <td>CDC<sup>a</sup></td>
                <td>[<xref ref-type="bibr" rid="ref16">16</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Cleveland Clinic</td>
                <td>[<xref ref-type="bibr" rid="ref17">17</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Docyet</td>
                <td>[<xref ref-type="bibr" rid="ref18">18</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Infermedica</td>
                <td>[<xref ref-type="bibr" rid="ref19">19</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Providence</td>
                <td>[<xref ref-type="bibr" rid="ref20">20</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Symptoma</td>
                <td>[<xref ref-type="bibr" rid="ref21">21</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Your.MD</td>
                <td>[<xref ref-type="bibr" rid="ref22">22</xref>]</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>CDC: US Centers for Disease Control and Prevention.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Clinical Cases</title>
        <p>We used a total of 460 clinical cases to evaluate the performance of the COVID-19 symptom checkers. Each case lists both symptoms and the correct diagnosis alongside the age and sex of the patient when available. Details of the two case sets used are given below and in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Number of symptoms and age and sex distributions in each case set (N=460).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="400"/>
            <col width="0"/>
            <col width="270"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td colspan="2"> Characteristic</td>
                <td colspan="3">Case set</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>COVID-19, n=50</td>
                <td>Control, n=410</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Number of symptoms</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Mean (SD)</td>
                <td>8.4 (4.1)</td>
                <td>9.8 (4.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Median</td>
                <td>7</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Age (years)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Mean (SD)</td>
                <td>45.6 (16.9)</td>
                <td>38.6 (22.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Median</td>
                <td>45</td>
                <td>38</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Sex, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Male</td>
                <td>25 (50)</td>
                <td>238 (58)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Female</td>
                <td>21 (42)</td>
                <td>160 (39)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Unknown</td>
                <td>4 (8)</td>
                <td>12 (2.9)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <sec>
          <title>COVID-19 Cases</title>
          <p>A total of 50 COVID-19 cases were extracted by three trained physicians from the literature in March and April 2020 and are listed in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. Each case describes one patient’s medical situation (ie, symptoms experienced or COVID-19 contacts). The symptoms of each case were extracted separately from the COVID-19 engine construction and evaluation. The physicians entering the symptoms did not know how the engine would react to their symptom lists. To the best of our knowledge, we included all cases available at the time except for severe edge cases (eg, several severe comorbidities causing unrelated symptoms). Changes to the initial symptom lists were not allowed later.</p>
        </sec>
        <sec>
          <title>Control Cases</title>
          <p>The COVID-19 case data enabled us to evaluate the sensitivity of the symptom checkers. To evaluate the specificity, 410 control cases from the <italic>British Medical Journal</italic> (BMJ) were also sourced [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. To allow a fair assessment, we only used cases containing at least one of the COVID-19 symptoms reported by the WHO [<xref ref-type="bibr" rid="ref12">12</xref>] (see <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). Classifying nonrelevant cases (eg, a fracture) would overestimate the symptom checkers’ specificity. Furthermore, these patients would not consult a web-based COVID-19 symptom checker. None of the 410 BMJ cases lists COVID-19 as the diagnosis, as the cases where collected before the COVID-19 outbreak.</p>
        </sec>
      </sec>
      <sec>
        <title>Mapping of Symptoms and Addressing Missing Inputs and Questions</title>
        <p>Each of the symptom checkers has a different interface and different question sequences to reach the diagnosis. Therefore, we mapped the exhibited symptoms across our cases to the constrained input allowed by each checker via a synonym table and hierarchy created by a trained physician. For example, if a checker asked for “shortness of breath” but the case description listed “respiratory distress” or “(acute) dyspnea”, the symptom was still correctly used for this case and symptom checker.</p>
        <p>Not all cases contained answers to all the questions of a checker. In such cases, the answer “I don't know” was chosen; if the “I don't know” answer option did not exist in a checker, “No” was used. In contrast, if a case contained information that did not fit any of the questions of the checker, this information was not used for this checker.</p>
      </sec>
      <sec>
        <title>Accuracy Evaluation</title>
        <p>For statistical analysis, we used the following classification:</p>
        <list list-type="bullet">
          <list-item>
            <p>True-positive : COVID-19 case classified as COVID-19</p>
          </list-item>
          <list-item>
            <p>False-positive: non–COVID-19 case classified as COVID-19</p>
          </list-item>
          <list-item>
            <p>True-negative: non–COVID-19 case classified as non–COVID-19</p>
          </list-item>
          <list-item>
            <p>False-negative: COVID-19 case classified as non–COVID-19</p>
          </list-item>
        </list>
        <p>For each symptom checker, we calculated the following metrics:</p>
        <p>Sensitivity (true-positive rate):</p>
        <p>
          <graphic xlink:href="jmir_v22i10e21299_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </p>
        <p>Specificity (true-negative rate):</p>
        <p>
          <graphic xlink:href="jmir_v22i10e21299_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </p>
        <p>F1 score (harmonic mean of the precision and recall):</p>
        <p>
          <graphic xlink:href="jmir_v22i10e21299_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </p>
        <p>Matthews correlation coefficient (MCC):</p>
        <p>
          <graphic xlink:href="jmir_v22i10e21299_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </p>
      </sec>
      <sec>
        <title>Classification of the Outputs of the Symptom Checkers</title>
        <p>Most COVID-19 symptom checkers return human-readable text that contains an association between the entered symptoms and COVID-19. We classified these associations into three different categories: high risk, medium risk, and low risk. Respective examples of a high, medium, and low risk classification are “There is a high risk that COVID-19 is causing your symptoms,” “Your symptoms are worrisome and may be related to COVID-19,” and “There's nothing at present to suggest that you have coronavirus (COVID-19). Please practice physical/social distancing.” Our full mapping of text outputs to risk for all symptom checkers and all text outputs is given in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
        <p>Some symptom checkers only have two possible outputs: COVID-19 risk or no COVID-19 risk. To compare symptom checkers with three and two risk levels, we performed two different analyses: (1) medium risk and high risk were treated as COVID-19–positive (and low risk was treated as COVID-19 as negative), and (2) high risk was treated as COVID-19–positive (and low risk and medium risk were treated as COVID-19–negative).</p>
      </sec>
      <sec>
        <title>Bootstrapping</title>
        <p>To evaluate the robustness of our statistical measures and account for the unbalanced dataset, we performed bootstrapping across our cases. A total of 3000 random samples consisting of 50 COVID-19 cases and 50 control cases was created by sampling with replacement from the original set of 50 COVID-19 cases and the 410 control cases.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p/>
      <p>To analyze the performance of the 10 web-based symptom checkers, we calculated the sensitivity and the specificity of each symptom checker based on the cases described in the method section. Scatterplots of the sensitivity and specificity to COVID-19 of the different symptom checkers are given in <xref rid="figure1" ref-type="fig">Figure 1</xref>, and detailed numerical values are provided in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref> and <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>. These symptom checkers fall approximately into four groups: upper left corner, lower right corner, central region, and upper right corner.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Sensitivities and specificities of web-based COVID-19 symptom checkers to COVID-19 cases and controls. The means of the 3000 random samples and 90% bootstrap CIs are reported as dots and crosses, respectively. (A) High risk: A COVID-19–positive prediction is defined only by a high risk result returned by a symptom checker. (B) Medium-high risk: A COVID-19–positive prediction is defined by either a medium risk or high risk result returned by a symptom checker. CDC: US Centers for Disease Control and Prevention; SF-COS: symptom frequency based on cosine similarity; SF-DIST: symptom frequency based on vector distance.</p>
        </caption>
        <graphic xlink:href="jmir_v22i10e21299_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>Further analysis of the true and false case classifications of these groups shows that the group in the upper left corner is composed of symptom checkers that require the presence of one (or few) highly specific symptoms to classify a case as COVID-19–positive (eg, “intensive contact with a COVID-19–positive person”). In this way, these symptom checkers miss many patients who are positive for COVID-19 who did not exactly report this highly specific symptom. In contrast, these highly specific symptoms are rarely present in non–COVID-19 cases. This results in low sensitivity and high specificity.</p>
      <p>The group in the lower right corner is composed of symptom checkers that predict a case as COVID-19–positive based on the presence of one or few COVID-19 associated symptoms (eg, the presence of fever or cough is sufficient to predict a patient to be COVID-19–positive). These checkers classify almost every patient that has a respiratory disorder or viral infection as COVID-19–positive. As such, they do not miss many patients with COVID-19 but wrongly predict many patients who do not have COVID-19 to be COVID-19–positive. This results in low specificity and high sensitivity.</p>
      <p>The group in the more central region is composed of symptom checkers that use a more balanced prediction but exhibit limited success in correctly classifying patients with and without COVID-19.</p>
      <p>The group in the upper right corner is composed of symptom checkers that also use a more balanced model to associate symptoms to COVID-19; however, in this case, the classification of patients with and without COVID-19 is more successful. </p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We classified 50 COVID-19 case descriptions from the recent literature as well as 410 non–COVID-19 control cases using 10 different web-based COVID-19 symptom checkers. Only 2/10 symptom checkers showed a reasonably good balance between sensitivity and specificity (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Most other checkers were either too sensitive, classifying almost all patients as COVID-19–positive, or too specific, classifying many patients with COVID-19 as COVID-19–negative (<xref rid="figure1" ref-type="fig">Figure 1</xref>). For example, our BMJ control cases included a patient suffering from a pulmonary disease who presented with various symptoms, including fever, cough, and shortness of breath, which are the three most frequent symptoms associated with COVID-19. Additional symptoms and risk factors were not considered by most checkers. Namely, loss of appetite, green sputum, and a history of smoking can be used to discern a correct diagnosis of COVID-19–negative.</p>
        <p>Furthermore, in terms of F1 score, most of the symptom checkers were outperformed by a simplistic symptom frequency vector approach; the F1 scores were 0.57 and 0.79 for SF-DIST and SF-COS, respectively. Notably, the cosine version showed surprisingly good results, outperforming 8/10 symptom checkers based on the F1 score.</p>
        <p>In contrast, it could also be argued that sensitivity is more important for a COVID-19 symptom checker than specificity (ie, numerous false-positive COVID-19 diagnoses are not of concern as long as no COVID-19 infections are missed). However, it is not difficult to create a symptom checker that is 100% sensitive by simply returning every test as COVID-19–positive. While no checker does this 100% of the time, some checkers tend to declare every person who reports any flu-like symptom to be COVID-19–positive. This assesses every patient with allergic asthma (“shortness of breath”), heatstroke (“fever”), or heavy smoker (“cough”) to be COVID-19–positive. Therefore, we believe that a healthy balance between sensitivity and specificity is necessary for a useful checker. However, from the figure in this paper, readers can decide for themselves which balance between sensitivity and specificity is most useful and select the corresponding checker.</p>
        <p>An additional aspect is that the developers of the 10 checkers may have had different purposes in mind during development. For example, they may have envisioned the checker to be a self-triage and recommendation tool or a likelihood predictor (as classified in [<xref ref-type="bibr" rid="ref2">2</xref>]). In our study, we found that most checkers provide a certain likelihood as well as recommendations; therefore, classification is difficult. Therefore, we did not further subgroup the checkers in our analysis.</p>
        <p>To our knowledge, this is the first scientific evaluation of web-based COVID-19 symptom checkers; however, there are a number of related studies evaluating symptom checkers. These include a study that evaluated 23 general-purpose symptom checkers based on 45 clinical case descriptions across a wide range of medical conditions and found that the correct diagnosis was listed among the top 20 results of the checkers in 58% of all cases on average [<xref ref-type="bibr" rid="ref2">2</xref>]. The aforementioned study design was extended to five additional symptom checkers using ear, nose, and throat (ENT) cases, showing similar results [<xref ref-type="bibr" rid="ref25">25</xref>]. Other evaluations include a study of symptom checkers used for knee pain cases; based on 527 patients and 26 knee problems, it was found that the physician’s diagnosis was present within the prediction list in 89% of the cases, while the specificity was only 27% [<xref ref-type="bibr" rid="ref26">26</xref>]. In another study, an analysis of an automated self-assessment triage system for university students prior to an in-person consultation with a physician found that the system’s urgency rating agreed perfectly in only 39% of cases; meanwhile, for the remaining cases, the system tended to be more risk-averse than the physician [<xref ref-type="bibr" rid="ref27">27</xref>]. Also, the applicability of web-based symptom checkers for 79 persons aged ≥50 years based on “think-aloud” protocols [<xref ref-type="bibr" rid="ref28">28</xref>], deep learning algorithms for medical imaging [<xref ref-type="bibr" rid="ref29">29</xref>], and services for urgent care [<xref ref-type="bibr" rid="ref3">3</xref>] were evaluated.</p>
        <p>The acceptability of the performance of a web-based symptom checker depends on the perspective and use of the results. In the case of COVID-19, a web-based assessment cannot fully replace a polymerase chain reaction (PCR) test, as some people are asymptomatic while others presenting with very specific COVID-19 symptoms may in fact have a very similar but different disease. Regardless, web-based COVID-19 symptom checkers can act as a first triage shield to avoid in-person physician visits or ease pressure on hospitals. Symptom checkers could even replace telephone triage lines in which non–medically trained personnel read a predefined sequence of questions. Although this was not part of this study, the authors believe that COVID-19 symptom checkers (if appropriately maintained and tested) may also be more reliable than the direct use of search engines such as Google or information via social media.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>The strength of this study lies in the fact that it is based on a large number of real patients’ case descriptions from the literature (n=460) and a detailed evaluation of the best performing symptom checker in terms of F1 score (<xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>). In contrast, a potential weakness of this study lies in its use of real literature-based cases, which may have biased the test set to rather severe cases of COVID-19 because mild and uninteresting cases are usually not found in the literature. We countered this bias by not including extreme edge cases from the literature in our 50 COVID-19 cases. A limitation of our study is that the benchmarking represents a specific point in time (April 2020; see Methods) and underlying algorithms may change. However, this temporal limitation is present in all benchmarking studies as knowledge increases and software is updated. Another bias may be that our control case descriptions do not report a COVID-19 contact, even though, for example, a person with a cold may have had a COVID-19 contact (and did not become infected). Another limitation of this study is the nonstraightforward mapping of the symptom checker outputs to risk levels (<xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). The interpretation of the textual output is debatable in some cases. We countered this by allowing three different risk levels and merging them in two different ways (see <xref rid="figure1" ref-type="fig">Figure 1</xref>A and <xref rid="figure1" ref-type="fig">Figure 1</xref>B). Also, every symptom checker output was classified by multiple persons until consensus was reached.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Symptom checkers are being widely used in response to the global COVID-19 pandemic. As such, quality assessment of these tools is critical. We show that various web-based COVID-19 symptom checkers vary widely in their predictive capabilities, with some performing equivalently to random guessing while others show strength in sensitivity, specificity, or both.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Symptom frequencies used in Multimedia Appendix 2.</p>
        <media xlink:href="jmir_v22i10e21299_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 28 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Pseudocode of symptom frequencies based on vector distance (SF-DIST) and cosine similarity (SF-COS).</p>
        <media xlink:href="jmir_v22i10e21299_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 49 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>List of the COVID-19 cases.</p>
        <media xlink:href="jmir_v22i10e21299_app3.pdf" xlink:title="PDF File  (Adobe PDF File), 50 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>List of COVID-19 symptoms according to the World Health Organization.</p>
        <media xlink:href="jmir_v22i10e21299_app4.pdf" xlink:title="PDF File  (Adobe PDF File), 13 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Mappings between output texts and risk levels of the symptom checkers. All mappings were independently performed by two different persons, and conflicts were resolved by a third person’s opinion.</p>
        <media xlink:href="jmir_v22i10e21299_app5.pdf" xlink:title="PDF File  (Adobe PDF File), 33 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Full table of sensitivities, specificities, accuracies, F1 scores, and Matthews correlation coefficients for all symptom checkers (COVID-19–positive was defined by “high risk” for nonbinary symptom checkers).</p>
        <media xlink:href="jmir_v22i10e21299_app6.pdf" xlink:title="PDF File  (Adobe PDF File), 24 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Full table of sensitivities, specificities, accuracies, F1 scores, and Matthews correlation coefficients for all symptom checkers (COVID-19–positive was defined by “medium risk or “high risk” for nonbinary symptom checkers).</p>
        <media xlink:href="jmir_v22i10e21299_app7.pdf" xlink:title="PDF File  (Adobe PDF File), 24 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Constraining symptoms for Symptoma.</p>
        <media xlink:href="jmir_v22i10e21299_app8.pdf" xlink:title="PDF File  (Adobe PDF File), 101 KB"/>
      </supplementary-material>
      <supplementary-material id="app9">
        <label>Multimedia Appendix 9</label>
        <p>Sensitivity vs specificity for all symptom checkers and Symptoma input constraint respectively by each symptom checker.</p>
        <media xlink:href="jmir_v22i10e21299_app9.pdf" xlink:title="PDF File  (Adobe PDF File), 253 KB"/>
      </supplementary-material>
      <supplementary-material id="app10">
        <label>Multimedia Appendix 10</label>
        <p>Full table of sensitivities, specificities, accuracies, F1 scores, and Matthews correlation coefficients for Symptoma constrained by each symptom checker (COVID-19–positive was defined by “high risk” for nonbinary symptom checkers).</p>
        <media xlink:href="jmir_v22i10e21299_app10.pdf" xlink:title="PDF File  (Adobe PDF File), 33 KB"/>
      </supplementary-material>
      <supplementary-material id="app11">
        <label>Multimedia Appendix 11</label>
        <p>Full table of sensitivities, specificities, accuracies, F1 scores, and Matthews correlation coefficients for Symptoma constrained by each symptom checker (COVID-19–positive was defined by “medium risk” or “high risk” for nonbinary symptom checkers).</p>
        <media xlink:href="jmir_v22i10e21299_app11.pdf" xlink:title="PDF File  (Adobe PDF File), 33 KB"/>
      </supplementary-material>
      <supplementary-material id="app12">
        <label>Multimedia Appendix 12</label>
        <p>Pairwise comparisons between all symptom checkers and Symptoma based on the MCC only if the subset of symptoms used by one checker is also used for Symptoma.</p>
        <media xlink:href="jmir_v22i10e21299_app12.pdf" xlink:title="PDF File  (Adobe PDF File), 79 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BMJ</term>
          <def>
            <p>British Medical Journal</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ENT</term>
          <def>
            <p>ear, nose, and throat</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">MCC</term>
          <def>
            <p>Matthews correlation coefficient</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">SF-COS</term>
          <def>
            <p>symptom frequency based on cosine similarity</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">SF-DIST</term>
          <def>
            <p>symptom frequency based on vector distance</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study received funding from the European Union’s Horizon 2020 research and innovation program under grant agreement no. 830017.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>All authors are employees of Symptoma GmbH. JN holds shares in Symptoma.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tasnim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hossain</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Mazumder</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Impact of Rumors and Misinformation on COVID-19 in Social Media</article-title>
          <source>J Prev Med Public Health</source>
          <year>2020</year>
          <month>05</month>
          <volume>53</volume>
          <issue>3</issue>
          <fpage>171</fpage>
          <lpage>174</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.3961/jpmph.20.094"/>
          </comment>
          <pub-id pub-id-type="doi">10.3961/jpmph.20.094</pub-id>
          <pub-id pub-id-type="medline">32498140</pub-id>
          <pub-id pub-id-type="pii">jpmph.20.094</pub-id>
          <pub-id pub-id-type="pmcid">PMC7280809</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Semigran</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Linder</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gidengil</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrotra</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of symptom checkers for self diagnosis and triage: audit study</article-title>
          <source>BMJ</source>
          <year>2015</year>
          <month>07</month>
          <day>08</day>
          <volume>351</volume>
          <fpage>h3480</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.h3480</pub-id>
          <pub-id pub-id-type="medline">26157077</pub-id>
          <pub-id pub-id-type="pmcid">PMC4496786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chambers</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cantrell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Preston</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Baxter</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Booth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Digital and online symptom checkers and assessment services for urgent care to inform a new digital platform: a systematic review</article-title>
          <source>Health Services and Delivery Research</source>
          <year>2019</year>
          <volume>7</volume>
          <issue>29</issue>
          <fpage>online</fpage>
          <pub-id pub-id-type="doi">10.3310/hsdr07290</pub-id>
          <pub-id pub-id-type="medline">31433612</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Duda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Solo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yaacoub</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schünemann</surname>
              <given-names>HJ</given-names>
            </name>
            <collab>COVID-19 Systematic Urgent Review Group Effort (SURGE) study authors</collab>
          </person-group>
          <article-title>Physical distancing, face masks, and eye protection to prevent person-to-person transmission of SARS-CoV-2 and COVID-19: a systematic review and meta-analysis</article-title>
          <source>Lancet</source>
          <year>2020</year>
          <month>06</month>
          <day>01</day>
          <fpage>1973</fpage>
          <lpage>1987</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0140-6736(20)31142-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)31142-9</pub-id>
          <pub-id pub-id-type="medline">32497510</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)31142-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7263814</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kissler</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Tedijanto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Grad</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Lipsitch</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Projecting the transmission dynamics of SARS-CoV-2 through the postpandemic period</article-title>
          <source>Science</source>
          <year>2020</year>
          <month>05</month>
          <day>22</day>
          <volume>368</volume>
          <issue>6493</issue>
          <fpage>860</fpage>
          <lpage>868</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32291278"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.abb5793</pub-id>
          <pub-id pub-id-type="medline">32291278</pub-id>
          <pub-id pub-id-type="pii">science.abb5793</pub-id>
          <pub-id pub-id-type="pmcid">PMC7164482</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Haidari</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Modelling during an emergency: the 2009 H1N1 influenza pandemic</article-title>
          <source>Clin Microbiol Infect</source>
          <year>2013</year>
          <month>11</month>
          <volume>19</volume>
          <issue>11</issue>
          <fpage>1014</fpage>
          <lpage>22</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1198-743X(14)63003-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/1469-0691.12284</pub-id>
          <pub-id pub-id-type="medline">23800220</pub-id>
          <pub-id pub-id-type="pii">S1198-743X(14)63003-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Philp</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>McCracken</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Quantifying social distancing arising from pandemic influenza</article-title>
          <source>J R Soc Interface</source>
          <year>2008</year>
          <month>06</month>
          <day>06</day>
          <volume>5</volume>
          <issue>23</issue>
          <fpage>631</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17916550"/>
          </comment>
          <pub-id pub-id-type="doi">10.1098/rsif.2007.1197</pub-id>
          <pub-id pub-id-type="medline">17916550</pub-id>
          <pub-id pub-id-type="pii">91N575G127432871</pub-id>
          <pub-id pub-id-type="pmcid">PMC3226987</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zviedrite</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uzicanin</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness of workplace social distancing measures in reducing influenza transmission: a systematic review</article-title>
          <source>BMC Public Health</source>
          <year>2018</year>
          <month>04</month>
          <day>18</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>518</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-018-5446-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-018-5446-1</pub-id>
          <pub-id pub-id-type="medline">29669545</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-018-5446-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC5907354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kristal</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rowell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kress</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Keeley</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Piwnica-Worms</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hendricks</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Wallach</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>A Phone Call Away: New York's Hotline And Public Health In The Rapidly Changing COVID-19 Pandemic</article-title>
          <source>Health Aff (Millwood)</source>
          <year>2020</year>
          <month>08</month>
          <day>01</day>
          <volume>39</volume>
          <issue>8</issue>
          <fpage>1431</fpage>
          <lpage>1436</lpage>
          <pub-id pub-id-type="doi">10.1377/hlthaff.2020.00902</pub-id>
          <pub-id pub-id-type="medline">32525707</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Judson</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Odisho</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Neinstein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Moriarty</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gleason</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Intinarelli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzales</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Rapid design and implementation of an integrated patient self-triage and self-scheduling tool for COVID-19</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>06</month>
          <day>01</day>
          <volume>27</volume>
          <issue>6</issue>
          <fpage>860</fpage>
          <lpage>866</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32267928"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa051</pub-id>
          <pub-id pub-id-type="medline">32267928</pub-id>
          <pub-id pub-id-type="pii">5817825</pub-id>
          <pub-id pub-id-type="pmcid">PMC7184478</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>I asked eight chatbots whether I had Covid-19. The answers ranged from ‘low’ risk to ‘start home isolation’</article-title>
          <source>STAT</source>
          <year>2020</year>
          <month>03</month>
          <day>23</day>
          <access-date>2020-09-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.statnews.com/2020/03/23/coronavirus-i-asked-eight-chatbots-whether-i-had-covid-19/">https://www.statnews.com/2020/03/23/coronavirus-i-asked-eight-chatbots-whether-i-had-covid-19/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
          <article-title>Report of the WHO-China Joint Mission on Coronavirus Disease 2019 (COVID-19)</article-title>
          <source>World Health Organization</source>
          <year>2020</year>
          <month>02</month>
          <access-date>2020-09-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/docs/default-source/coronaviruse/who-china-joint-mission-on-covid-19-final-report.pdf">https://www.who.int/docs/default-source/coronaviruse/who-china-joint-mission-on-covid-19-final-report.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 screener</article-title>
          <source>ada</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ada.com/covid-19-screener/">https://ada.com/covid-19-screener/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 Screening Tool</article-title>
          <source>Apple</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.apple.com/covid19">https://www.apple.com/covid19</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 Symptom Checker</article-title>
          <source>Babylon</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.babylonhealth.com/ask-babylon-chat">https://www.babylonhealth.com/ask-babylon-chat</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <article-title>Symptoms of Coronavirus</article-title>
          <source>US Centers for Disease Control and Prevention</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/coronavirus/2019-ncov/symptoms-testing/symptoms.html">https://www.cdc.gov/coronavirus/2019-ncov/symptoms-testing/symptoms.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <article-title>Coronavirus Self-Checker</article-title>
          <source>Cleveland Clinic</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://covid19chat.clevelandclinic.org/">http://covid19chat.clevelandclinic.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>Corona information. Webpage in German</article-title>
          <source>Docyet</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://corona.docyet.com/client/index.html">https://corona.docyet.com/client/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <article-title>Symptomate</article-title>
          <source>Infermedica</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://symptomate.com/covid19/checkup/en/">https://symptomate.com/covid19/checkup/en/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <article-title>Coronavirus assessment tool</article-title>
          <source>Providence</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://coronavirus.providence.org/">https://coronavirus.providence.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 Chatbot Test</article-title>
          <source>COVID-19</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.symptoma.com/covid-19">https://www.symptoma.com/covid-19</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <source>Your.MD</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://webapp.your.md/login">https://webapp.your.md/login</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <source>BMJ Best Practice</source>
          <access-date>2020-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bestpractice.bmj.com/info/">https://bestpractice.bmj.com/info/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <article-title>BMJ Case Reports</article-title>
          <source>BMJ Journals</source>
          <access-date>2020-09-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://casereports.bmj.com">https://casereports.bmj.com</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nateqi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Krobath</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gruarin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lutz</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dvorak</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gruschina</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ortner</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>From symptom to diagnosis-symptom checkers re-evaluated: Are symptom checkers finally sufficient and accurate to use? An update from the ENT perspective.</article-title>
          <source>HNO</source>
          <year>2019</year>
          <month>05</month>
          <day>16</day>
          <volume>67</volume>
          <issue>5</issue>
          <fpage>334</fpage>
          <lpage>342</lpage>
          <pub-id pub-id-type="doi">10.1007/s00106-019-0666-y</pub-id>
          <pub-id pub-id-type="medline">30993374</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00106-019-0666-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bisson</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Komm</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Bernas</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Fineberg</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Marzo</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Rauh</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Smolinski</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wind</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Accuracy of a computer-based diagnostic program for ambulatory patients with knee pain</article-title>
          <source>Am J Sports Med</source>
          <year>2014</year>
          <month>10</month>
          <volume>42</volume>
          <issue>10</issue>
          <fpage>2371</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1177/0363546514541654</pub-id>
          <pub-id pub-id-type="medline">25073597</pub-id>
          <pub-id pub-id-type="pii">0363546514541654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Poote</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>French</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Dale</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Powell</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A study of automated self-assessment in a primary care student health centre setting</article-title>
          <source>J Telemed Telecare</source>
          <year>2014</year>
          <month>03</month>
          <day>18</day>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>123</fpage>
          <lpage>127</lpage>
          <pub-id pub-id-type="doi">10.1177/1357633x14529246</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luger</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Houston</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Suls</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Older adult experience of online diagnosis: results from a scenario-based think-aloud protocol</article-title>
          <source>J Med Internet Res</source>
          <year>2014</year>
          <month>01</month>
          <day>16</day>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>e16</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2014/1/e16/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.2924</pub-id>
          <pub-id pub-id-type="medline">24434479</pub-id>
          <pub-id pub-id-type="pii">v16i1e16</pub-id>
          <pub-id pub-id-type="pmcid">PMC3906693</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nagendran</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lovejoy</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Komorowski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Topol</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ioannidis</surname>
              <given-names>JPA</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Maruthappu</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence versus clinicians: systematic review of design, reporting standards, and claims of deep learning studies</article-title>
          <source>BMJ</source>
          <year>2020</year>
          <month>03</month>
          <day>25</day>
          <volume>368</volume>
          <fpage>m689</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.m689</pub-id>
          <pub-id pub-id-type="medline">32213531</pub-id>
          <pub-id pub-id-type="pmcid">PMC7190037</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
