<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i7e28812</article-id>
      <article-id pub-id-type="pmid">34156964</article-id>
      <article-id pub-id-type="doi">10.2196/28812</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Evaluation of a Parsimonious COVID-19 Outbreak Prediction Model: Heuristic Modeling Approach Using Publicly Available Data Sets</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Basch</surname>
            <given-names>Corey</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Foraker</surname>
            <given-names>Randi</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Soshnikov</surname>
            <given-names>Sergey</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pesälä</surname>
            <given-names>Samuli</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Gupta</surname>
            <given-names>Agrayan K</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Indiana University</institution>
            <addr-line>107 S Indiana Ave</addr-line>
            <addr-line>Bloomington, IN, 47405</addr-line>
            <country>United States</country>
            <phone>1 812 855 4848</phone>
            <email>aggupta@iu.edu</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9600-4932</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Grannis</surname>
            <given-names>Shaun J</given-names>
          </name>
          <degrees>MD, MS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8093-6639</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Kasthurirathne</surname>
            <given-names>Suranga N</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6630-4598</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Indiana University</institution>
        <addr-line>Bloomington, IN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Center for Biomedical Informatics</institution>
        <institution>Regenstrief Institute</institution>
        <addr-line>Indianapolis, IN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>School of Medicine</institution>
        <institution>Indiana University</institution>
        <addr-line>Indianapolis, IN</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Agrayan K Gupta <email>aggupta@iu.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>7</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>26</day>
        <month>7</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>7</issue>
      <elocation-id>e28812</elocation-id>
      <history>
        <date date-type="received">
          <day>23</day>
          <month>3</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>5</day>
          <month>5</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>2</day>
          <month>6</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>12</day>
          <month>6</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Agrayan K Gupta, Shaun J Grannis, Suranga N Kasthurirathne. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 26.07.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/7/e28812" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The COVID-19 pandemic has changed public health policies and human and community behaviors through lockdowns and mandates. Governments are rapidly evolving policies to increase hospital capacity and supply personal protective equipment and other equipment to mitigate disease spread in affected regions. Current models that predict COVID-19 case counts and spread are complex by nature and offer limited explainability and generalizability. This has highlighted the need for accurate and robust outbreak prediction models that balance model parsimony and performance.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We sought to leverage readily accessible data sets extracted from multiple states to train and evaluate a parsimonious predictive model capable of identifying county-level risk of COVID-19 outbreaks on a day-to-day basis.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Our modeling approach leveraged the following data inputs: COVID-19 case counts per county per day and county populations. We developed an outbreak gold standard across California, Indiana, and Iowa. The model utilized a per capita running 7-day sum of the case counts per county per day and the mean cumulative case count to develop baseline values. The model was trained with data recorded between March 1 and August 31, 2020, and tested on data recorded between September 1 and October 31, 2020.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The model reported sensitivities of 81%, 92%, and 90% for California, Indiana, and Iowa, respectively. The precision in each state was above 85% while specificity and accuracy scores were generally &#62;95%.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our parsimonious model provides a generalizable and simple alternative approach to outbreak prediction. This methodology can be applied to diverse regions to help state officials and hospitals with resource allocation and to guide risk management, community education, and mitigation strategies.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>coronavirus</kwd>
        <kwd>COVID-19</kwd>
        <kwd>emerging outbreak</kwd>
        <kwd>modeling disease outbreak</kwd>
        <kwd>precision public health</kwd>
        <kwd>predictive modeling</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The COVID-19 pandemic has impacted the health and well-being of individuals, communities, and economies worldwide at a hitherto unprecedented scale [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. On March 11, 2020, the World Health Organization declared COVID-19 a pandemic with over 118,000 confirmed cases and 4291 deaths in over 114 countries [<xref ref-type="bibr" rid="ref4">4</xref>]. To date, the pandemic has resulted in over 170 million confirmed cases, with over 3.5 million deaths globally [<xref ref-type="bibr" rid="ref5">5</xref>]. In the United States, 33 million people have had COVID-19 and more than 600,000 lives have been lost [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
        <p>At the height of the pandemic, waves of viral outbreaks placed health systems across the globe under extended strain, leading to shortages in hospital beds, personal protective equipment, and health care personnel, which caused significant disruptions to health care delivery and loss of life [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Experts have estimated the cumulative financial costs of the COVID-19 pandemic related to lost output and health reduction at US $16 trillion, or approximately 90% of the annual gross domestic product of the United States [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
        <p>In contrast with historical pandemics, the availability of public and population health information systems has enabled researchers to collaborate on many research activities in response to COVID-19 [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Since the onset of the pandemic, data scientists have collaborated with governmental organizations to create various public-facing COVID-19 dashboards that provide easy access to descriptive statistics and other metrics [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Information on COVID-19–related mortality, utilization of health care resources, and recovery has been crucial in increasing situational awareness to inform ongoing pandemic response efforts across communities [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>Most recently, COVID-19 infection rates have started to decrease in response to increased vaccination and efforts in public education [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. To date, 40% of the population of the United States is fully vaccinated [<xref ref-type="bibr" rid="ref16">16</xref>]. These improvements have led to an interest in relaxing or revoking various restrictions enforced at the state and county levels. While important to the well-being of both communities and economies, such decisions may be dangerous if undertaken without adequate preplanning and awareness of potential risks. As such, effective identification of potential outbreaks of COVID-19 offers the ability to inform decision-makers across governmental and public health sectors on how to resume normal day-to-day activities in their communities and deploy limited human and treatment resources to where they are most needed [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>Previous studies have demonstrated the potential to apply analytical models to identify potential outbreaks in response to other diseases [<xref ref-type="bibr" rid="ref18">18</xref>]. However, these methods rely on large, complex data sets extracted from a specific health system or region [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. Such data sets may be challenging and time-consuming to collect, leading to delays in generating timely predictions. Further, models trained using locale-specific data sets may not be generalizable across other locations [<xref ref-type="bibr" rid="ref22">22</xref>], hindering the potential of reusing such models across other patient populations and regions. A variety of models are trained using complex algorithmic approaches such as neural networks and deep learning models. Such machine learning approaches may yield superior results but fail to achieve widespread acceptance [<xref ref-type="bibr" rid="ref23">23</xref>] owing to challenges in explainability and interpretation [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
        <p>In contrast, a less complex modeling approach that uses a subset of easily obtainable key elements widely captured across broad geographic regions may be less challenging to develop. Further, such models may also deliver adequate predictive performance without sacrificing explainability and interpretability. Such parsimonious models may also present less risk of overfitting on training data sets, thus allowing for greater generalizability [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>We seek to leverage various readily accessible data sets extracted from multiple states to train and evaluate a parsimonious predictive model capable of identifying the county-level risk of COVID-19 outbreaks on a day-to-day basis.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Methods Overview</title>
        <p>We selected 3 states for our efforts in COVID-19 outbreak prediction modeling: California, Indiana, and Iowa. These states were selected on the basis of geographical factors, governmental regulations, and availability of data sets for public use. For example, Indiana and Iowa are similar in the number of counties and total populations [<xref ref-type="bibr" rid="ref26">26</xref>]. In contrast, California represented a more populous, urbanized state [<xref ref-type="bibr" rid="ref26">26</xref>]. We also considered the general completeness of reporting, the quality of basic COVID-19 data sources, and the accuracy of state tracking systems [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
      </sec>
      <sec>
        <title>Data Extraction and Cleaning</title>
        <p>For each state, we extracted a variety of county-level data elements captured daily between March 1 and October 31, 2020. Data for Indiana were obtained from the Indiana State Department of Health, while data for Iowa and California were obtained from the New York Times web-based repository [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. We selected March 1, 2020, as a start date as most states began collecting COVID-19 data at this time. October 31, 2020, marked the end of our analysis time period. Each data set was organized by county, state, and date reported using R [<xref ref-type="bibr" rid="ref29">29</xref>]. Several errors or omissions in the data sets were addressed as follows: days with negative case counts were changed to 0 and a county labeled as “unknown” reported by Iowa and California were removed from further evaluation.</p>
      </sec>
      <sec>
        <title>Preparation of a Gold Standard</title>
        <p>We created a gold standard indicating if each county under study was in an outbreak on any particular day. A human expert reviewer created the gold standard by assigning an outbreak label (with responses of “yes” or “no”) to each county or date combination, considering the following criteria:</p>
        <list list-type="order">
          <list-item>
            <p>How do case counts trend in each county? Is there a general baseline of cases over time?</p>
          </list-item>
          <list-item>
            <p>How large is the county’s population size (counties with more people report more cases)?</p>
          </list-item>
          <list-item>
            <p>Duration of the outbreak to assign a binary indicator of “outbreak detected” or “outbreak not detected” to each day and county.</p>
          </list-item>
        </list>
        <p>Based on our approach, a county could have multiple outbreaks over time. Outbreaks lasted a minimum of 3 days to account for testing lags as data were not always reported on the same day, especially during the initial phases of the pandemic [<xref ref-type="bibr" rid="ref30">30</xref>]. Furthermore, lower case counts at the end of an outbreak and on weekends owing to the closure of testing centers were also considered using 7-day average metrics.</p>
      </sec>
      <sec>
        <title>Model Building</title>
        <p>We created a heuristic outbreak prediction model using the training data sets obtained from all 3 states and evaluated its performance across the holdout test data sets and the gold standard. For each county, data collected between March 1 and August 31, 2020, were considered the training data set, while data collected between September 1 and October 31, 2020, were considered the test data set. As a preliminary step toward model development, we considered features used in other common models, including the susceptible-infected-recovered epidemic [<xref ref-type="bibr" rid="ref31">31</xref>] and time delay [<xref ref-type="bibr" rid="ref32">32</xref>] models, severity of lockdown measures [<xref ref-type="bibr" rid="ref33">33</xref>], cumulative cases (both reported and not reported) [<xref ref-type="bibr" rid="ref34">34</xref>], and daily test reports [<xref ref-type="bibr" rid="ref35">35</xref>]. Furthermore, predictive models for infectious diseases, such as susceptible-infected-recovered models, provide guidance on disease transmission and outbreak causation. The State of Wisconsin’s COVID-19 dashboard used a Case Rate metric defined as a per capita running 7-day sum of the case counts per county per day [<xref ref-type="bibr" rid="ref36">36</xref>]. Case Rate standardizes COVID-19 severity across counties of differing populations while also accounting for data lags and providing insight on transmission. We plotted Case Rate vs Indiana county populations to generate a general trendline that could differentiate between “outbreak detected” or “outbreak not detected” days. Our logarithmic graph semiaccurately depicted a horizontal line that separated outbreak days. The following steps were undertaken to leverage and apply the trendline results on states and counties with various populations.</p>
        <p>We started building the model by dividing counties on the basis of population size, initially at 100,000 population intervals. Since Case Rate is more sensitive to less populated counties, we added intervals for counties with less than 100,000 people. Each population interval was allocated an assigned Case Rate baseline value that served as a binary indicator for outbreak determination. We implemented a criterion where an outbreak was underway in counties if they were 4 SDs above the cumulative case count mean to account for data lag. As depicted in the system flow diagram (<xref rid="figure1" ref-type="fig">Figure 1</xref>), we established these parameter values and trained the model rules with the training data sets (data reported between March 1 and August 31, 2020). The train-to-test partition was approximately 71% to 29%, respectively, which is close to optimal for large data sets [<xref ref-type="bibr" rid="ref37">37</xref>]. Then, the model was tested against the gold standard with the test data sets (data reported between September 1 and October 31, 2020). <xref rid="figure1" ref-type="fig">Figure 1</xref> shows a flow diagram depicting our study approach.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flow diagram providing an overview of the study methodology.</p>
          </caption>
          <graphic xlink:href="jmir_v23i7e28812_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Results Overview</title>
        <p>We collected data on a total of 249 counties from across all 3 states. <xref ref-type="table" rid="table1">Table 1</xref> presents descriptive statistics for each state, including the number of counties, population sizes, and urbanization to highlight each state’s fundamental differences [<xref ref-type="bibr" rid="ref26">26</xref>]. Previous studies have identified multiple factors in determining urban vs rural areas, including the total population, population density, and commuting flow [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
        <p>Indiana and Iowa have similar county population distributions, with both having a majority of counties with less than 100,000 people. However, Indiana has more midsized counties with its largest county having almost 1 million people, while California has several counties having populations of more than 1 million people. Moreover, California has the highest percentage of the urban population (94.95%), with Indiana (72.44%) and Iowa (64.02%) far behind.</p>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> provides an example visualization of outbreak determination in Cass County, Indiana, and Santa Barbara County, California, for gold standard preparation. Cass and Santa Barbara counties have populations of 37,689 and 446,499 people, respectively [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>State and county population sizes and population statistics based on census counts.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="610"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Census counts</td>
                <td colspan="2">Indiana</td>
                <td colspan="2">Iowa</td>
                <td>California</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>County-level statistics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Counties, n</td>
                <td colspan="2">92</td>
                <td colspan="2">99</td>
                <td colspan="2">58</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Counties where population is &#60;100,000 people, n</td>
                <td colspan="2">75</td>
                <td colspan="2">93</td>
                <td colspan="2">23</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Counties where the population is ≥100,000 and &#60;500,000 people, n</td>
                <td colspan="2">16</td>
                <td colspan="2">6</td>
                <td colspan="2">19</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Counties where the population is ≥500,000 and &#60;1,000,000 people, n</td>
                <td colspan="2">1</td>
                <td colspan="2">0</td>
                <td colspan="2">7</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Counties where the population is &#62;1,000,000 people, n</td>
                <td colspan="2">0</td>
                <td colspan="2">0</td>
                <td colspan="2">9</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Population of the smallest county (people), n</td>
                <td colspan="2">5875</td>
                <td colspan="2">3602</td>
                <td colspan="2">1129</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Population of the largest county (people), n</td>
                <td colspan="2">964,582</td>
                <td colspan="2">490,161</td>
                <td colspan="2">10,039,107</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Urban population, %</td>
                <td colspan="2">72.44</td>
                <td colspan="2">64.02</td>
                <td colspan="2">94.95</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Household income (US $), median</td>
                <td colspan="2">59,892</td>
                <td colspan="2">68,718</td>
                <td colspan="2">70,489</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Case count per day, mean (SD)</td>
                <td colspan="2">7.98 (21.02)</td>
                <td colspan="2">6.18 (15.75)</td>
                <td>70.33 (231.86)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Visualization of the COVID-19 case counts in Cass County, Indiana, and Santa Barbara County, California, between March 1 and October 31, 2020. Outbreak days are indicated in red, and normal days are indicated in black.</p>
          </caption>
          <graphic xlink:href="jmir_v23i7e28812_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows the prevalence of the number of outbreaks and their durations in each state over the training, test, and total time periods. In Indiana and Iowa, the number of outbreaks doubled from the training to the test date range, despite the training data set being almost 3-fold as large as the test data set. Furthermore, the percentage of days in an outbreak between the training and test ranges quadrupled to 22.6% and 20.1% for Indiana and Iowa, respectively. The percentage of outbreak days in California remained relatively stable, while the average outbreak duration decreased from 47 days to 19 days. Because counties were our unit of analysis and since California had fewer and more populated counties than Indiana or Iowa, we believe that these factors contributed to the reduced number of outbreaks in California.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>COVID-19 outbreak prevalence descriptors from the gold standard. Indiana, Iowa, and California data sets were divided by training (March 1 to August 31, 2020), test (September 1 to October 31, 2020), and total (March 1 to October 31, 2020) date ranges to characterize the outbreak periods.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="280"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="0"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <col width="0"/>
            <col width="80"/>
            <col width="80"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Prevalence descriptors</td>
                <td colspan="4">Indiana</td>
                <td colspan="4">Iowa</td>
                <td colspan="3">California</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Training</td>
                <td>Test</td>
                <td>Total</td>
                <td colspan="2">Training</td>
                <td>Test</td>
                <td>Total</td>
                <td colspan="2">Training</td>
                <td>Test</td>
                <td>Total</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Outbreaks, n</td>
                <td>26</td>
                <td>65</td>
                <td>83</td>
                <td colspan="2">43</td>
                <td>85</td>
                <td>114</td>
                <td colspan="2">35</td>
                <td>26</td>
                <td>40</td>
              </tr>
              <tr valign="top">
                <td>Outbreak duration (days), mean</td>
                <td>25.00</td>
                <td>19.18</td>
                <td>22.86</td>
                <td colspan="2">18.18</td>
                <td>14.62</td>
                <td>15.79</td>
                <td colspan="2">47.29</td>
                <td>19.31</td>
                <td>53.92</td>
              </tr>
              <tr valign="top">
                <td>Total outbreak days, n</td>
                <td>650</td>
                <td>1247</td>
                <td>1897</td>
                <td colspan="2">727</td>
                <td>1199</td>
                <td>1926</td>
                <td colspan="2">1655</td>
                <td>502</td>
                <td>2157</td>
              </tr>
              <tr valign="top">
                <td>Outbreak days, %</td>
                <td>3.86</td>
                <td>22.59</td>
                <td>8.45</td>
                <td colspan="2">4.01</td>
                <td>20.15</td>
                <td>7.97</td>
                <td colspan="2">15.59</td>
                <td>14.43</td>
                <td>5.24</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Model Rules</title>
        <p>Using the aforementioned data sets, we developed model parameters to predict COVID-19 outbreaks.</p>
        <p><xref rid="figure3" ref-type="fig">Figure 3</xref> shows a top-down decision tree for our model’s behavior. Rules and the assigned case rate associated with each population band used in the decision-making process are further outlined in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. As shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>, the heuristic model determined that counties experienced an outbreak through the following methods:</p>
        <list list-type="order">
          <list-item>
            <p>For the specified population band, a county’s case rate on a given day was greater than the minimum case rate assigned to that population.</p>
          </list-item>
          <list-item>
            <p>The county’s case count on a specific day was greater than 12 and was 4 SDs above the rolling mean county-level COVID-19 case count.</p>
          </list-item>
          <list-item>
            <p>If a county met either requirement on a specific day, that county was considered to be “in outbreak.”</p>
          </list-item>
        </list>
        <p>By combining these rules with the previously developed gold standard, a confusion matrix was utilized to analyze the model’s performance.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Decision-making process of our heuristic model.</p>
          </caption>
          <graphic xlink:href="jmir_v23i7e28812_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p><xref ref-type="table" rid="table3">Table 3</xref> shows the results of the confusion matrix when the prediction model was applied to the curated gold standard during the test date range from September 1 to October 31, 2020. Sensitivity is the proportion of correctly identified positives, while specificity is the proportion of correctly identified negatives. All 4 key confusion matrix statistics—sensitivity, specificity, precision, and accuracy—were above 80% in each state during the test range. Model specificity and accuracy were &#62;94% for each state. This was attributed to most days being classified as true negatives, which are fundamentally more straightforward to detect than true positives. Model sensitivity for Indiana and Iowa was 10% greater than that of California. However, their precision was 11% and 7% lower, respectively. For Indiana and Iowa, this implies that the model computed fewer false-negative readings, which could be attributed to having increasingly prolonged outbreaks (<xref ref-type="table" rid="table1">Table 1</xref>). California’s higher precision but lower sensitivity implies that the model was more precise in predicting when outbreaks occurred but less successful in capturing all outbreaks.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Results of the model with the test data set relative to the gold standard.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Performance parameters</td>
                <td>Indiana</td>
                <td>Iowa</td>
                <td>California</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Test date range</td>
                <td>September 1 to October 31, 2020</td>
                <td>September 1 to October 31, 2020</td>
                <td>September 1 to October 31, 2020</td>
              </tr>
              <tr valign="top">
                <td>Sensitivity, %</td>
                <td>92.33</td>
                <td>90.05</td>
                <td>80.86</td>
              </tr>
              <tr valign="top">
                <td>Specificity, %</td>
                <td>95.56</td>
                <td>97.40</td>
                <td>99.57</td>
              </tr>
              <tr valign="top">
                <td>Precision, %</td>
                <td>85.04</td>
                <td>89.83</td>
                <td>96.96</td>
              </tr>
              <tr valign="top">
                <td>Accuracy, %</td>
                <td>94.86</td>
                <td>95.91</td>
                <td>96.85</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Our efforts resulted in the development of a heuristic model capable of detecting COVID-19 outbreaks, with predictive measures between 80% and 99%. The model had sensitivities of 92%, 90%, and 81% for Indiana, Iowa, and California, respectively. This indicates that the model was capable of identifying a clear majority of outbreaks across each state. The model also reported precision scores of 85%, 89%, and 96% for Indiana, Iowa, and California, respectively, which indicated that most positive predictions made by the model were accurate. These performance metrics indicate that the model is fit for use in real-life settings. Additionally, the training and test periods displayed distinct outbreak characteristics owing to the increased spread of COVID-19.</p>
        <p>These performance metrics are also notable, considering that the prevalence of outbreaks in training data sets was considerably low and could have resulted in weak predictive models had we used more traditional classification-based modeling approaches, which significantly underperform when trained using unbalanced data sets [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. As the pandemic progressed, each state attempted to enhance their data reporting systems. As described by Khakharia et al [<xref ref-type="bibr" rid="ref41">41</xref>], some regions reported sudden and significant changes in case counts, making it difficult for models to forecast future cases. Though outbreaks are not fundamentally different, the training and test data sets can be characterized separately. Despite the test range being shorter, Indiana and Iowa both reported twice as many outbreaks during the test period. This can be attributed to the second wave of COVID-19 that occurred during the test period as schools resumed, governors relaxed state lockdown laws, and people returned to work [<xref ref-type="bibr" rid="ref42">42</xref>]. For example, California was one of the last states to begin lifting restrictions in midsized and large counties, which may have contributed to relatively fewer outbreaks than those in Indiana and Iowa [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. Thus, counties re-entered or for the first time realized outbreak periods during the test period.</p>
        <p>California remains a state of interest owing to the characterization of its outbreaks as well as predictive performance results on the holdout test data set. Unlike Indiana and Iowa, California has several counties with populations of over 1,000,000 people; furthermore, it was the only state with fewer outbreaks and a low percentage of outbreak days between the training and test periods. The California model revealed a significantly lower sensitivity but higher precision. Thus, to Indiana and Iowa, the California model captured proportionally fewer outbreaks but predicted the subset with greater precision.</p>
        <p>This parsimonious prediction model is easily replicable in other states, as it only utilizes county population and COVID-19 cases per day per county data. States can detect and predict outbreaks with high accuracy by following the model’s rules. Current outbreak prediction approaches are based on machine learning algorithms. Though they generally have very high accuracies, these models incorporate a variety of data points and can overfit models [<xref ref-type="bibr" rid="ref22">22</xref>]. The heuristic model’s data simplicity enables it to be easily implemented in other regions, especially those with limited reported systems. It is also an understandable and accurate method to relay a county’s current state of COVID-19 to the general public, who are not as informed in health metrics. In addition to public and internal communication, forecasting models can be applied to aid in outbreak preparation and community mitigation methods [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
        <p>In addition to a high-performing heuristic model, our efforts also led to the development of a well-curated gold standard data set consisting of outbreak status for each county on a day-to-day basis. This data set is shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> to facilitate additional studies on this important issue.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our study was impacted by limitations in data collection systems currently deployed by each state. The inconsistency of data reporting presented a significant systematic challenge for model building activities. For instance, states closed most COVID-19 testing centers on weekends, which led to lower case count values on Saturdays and Sundays. Further, many states did not publish most of their own COVID-19 data, which led us to obtain data on cases per day per county from the New York Times instead of a state’s Department of Health, the latter being more accurate. The New York Times would retroactively change case data, making it more unreliable since there were days with negative values.</p>
        <p>The lack of previous studies on curating gold standards on disease outbreaks also presents limitations. With no industry standard on defining an outbreak, we created the gold standard on the basis of intuition and the aforementioned specified criteria. Therefore, this process could have been subject to potential confounders, which may have influenced our model’s results. Furthermore, the rule-based model approach is subject to several limitations. Since the model incorporated a 7-day moving Case Rate, there was a lag at the tails of outbreaks as the increased case counts were not initially detected. Even with a parsimonious approach, the parameters derived from our results can greatly differ when applied to other regions. This uncertainty, resulting from parameters, social mandates, and vaccination, is a feature of any prediction model. We helped lessen this uncertainty through our generalizable approach demonstrated in diverse states.</p>
      </sec>
      <sec>
        <title>Future Prospects</title>
        <p>The ongoing COVID-19 pandemic has led most major institutions to allocate tremendous resources for its resolution. The model would benefit from a larger sample size of US states, and possibly regions worldwide, to test its generalizability on a more expansive scale. Additionally, we could expand the model’s data range for the third wave of cases and as the COVID-19 vaccine is distributed to a majority of the population, to determine its functionality beyond the scope of this study. Our results could also be translated to provide a clearer epidemiological outlook of diseases. Since the model can predict outbreaks with high accuracy, it could be tested on historical COVID-19 data to determine when most outbreaks occurred easily in a particular region. Moreover, trends and patterns were found across outbreaks among various factors such as lockdown policies, air pollution levels, and civilian obedience. Understanding the causes of outbreaks presents interesting findings related to public policy adaptation in current and future situations.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study presents an accurate, generalizable, and explainable COVID-19 outbreak prediction model. The model reported sensitivity scores of &#62;90% in Indiana and Iowa and &#62;80% in California. Furthermore, model specificity and accuracy scores were &#62;94% in every state. These results, coupled with the minimal data inputs required, creates an explainable and easy-to-implement model that governments and policymakers can utilize to assess COVID-19 severity across diverse geographic regions. Future studies are required to test the model in other states and countries by using more recent data. Moreover, the model should be used to identify outbreaks to investigate correlations among external factors such as socioeconomic risks, air pollution, county-level laws, and outbreak development.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Population bands with their respective minimum case rates.</p>
        <media xlink:href="jmir_v23i7e28812_app1.xls" xlink:title="XLS File  (Microsoft Excel File), 26 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Outbreak gold standard for each county in California, Indiana, and Iowa per day.</p>
        <media xlink:href="jmir_v23i7e28812_app2.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 38 KB"/>
      </supplementary-material>
    </app-group>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Strasser</surname>
              <given-names>ZH</given-names>
            </name>
            <name name-style="western">
              <surname>Klann</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Naseri</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wagholikar</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>Predicting COVID-19 mortality with electronic medical records</article-title>
          <source>NPJ Digit Med</source>
          <year>2021</year>
          <month>02</month>
          <day>04</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>15</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-021-00383-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-021-00383-x</pub-id>
          <pub-id pub-id-type="medline">33542473</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-021-00383-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC7862405</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hartley</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Perencevich</surname>
              <given-names>EN</given-names>
            </name>
          </person-group>
          <article-title>Public Health Interventions for COVID-19: Emerging Evidence and Implications for an Evolving Public Health Crisis</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>05</month>
          <day>19</day>
          <volume>323</volume>
          <issue>19</issue>
          <fpage>1908</fpage>
          <lpage>1909</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2020.5910</pub-id>
          <pub-id pub-id-type="medline">32275299</pub-id>
          <pub-id pub-id-type="pii">2764656</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bloom</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Terry</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>COVID-Induced Economic Uncertainty</article-title>
          <source>National Bureau of Economic Research</source>
          <year>2020</year>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nber.org/system/files/working_papers/w26983/w26983.pdf">https://www.nber.org/system/files/working_papers/w26983/w26983.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McNeil</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Coronavirus Has Become a Pandemic</article-title>
          <source>The New York Times</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nytimes.com/2020/03/11/health/coronavirus-pandemic-who.html">https://www.nytimes.com/2020/03/11/health/coronavirus-pandemic-who.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <article-title>Coronavirus (Covid-19) Data</article-title>
          <source>The New York Times Developer Network</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://developer.nytimes.com/covid">https://developer.nytimes.com/covid</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Haase</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>XQ</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>BX</given-names>
            </name>
          </person-group>
          <article-title>The experiences of health-care providers during the COVID-19 crisis in China: a qualitative study</article-title>
          <source>Lancet Glob Health</source>
          <year>2020</year>
          <month>06</month>
          <volume>8</volume>
          <issue>6</issue>
          <fpage>e790</fpage>
          <lpage>e798</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-109X(20)30204-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2214-109X(20)30204-7</pub-id>
          <pub-id pub-id-type="medline">32573443</pub-id>
          <pub-id pub-id-type="pii">S2214-109X(20)30204-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7190296</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cutler</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Summers</surname>
              <given-names>LH</given-names>
            </name>
          </person-group>
          <article-title>The COVID-19 Pandemic and the $16 Trillion Virus</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>10</month>
          <day>20</day>
          <volume>324</volume>
          <issue>15</issue>
          <fpage>1495</fpage>
          <lpage>1496</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33044484"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2020.19759</pub-id>
          <pub-id pub-id-type="medline">33044484</pub-id>
          <pub-id pub-id-type="pii">2771764</pub-id>
          <pub-id pub-id-type="pmcid">PMC7604733</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>NIH Launches Platform to Serve as Depository for COVID-19 Medical Data</article-title>
          <source>JAMA</source>
          <year>2020</year>
          <month>07</month>
          <day>28</day>
          <volume>324</volume>
          <issue>4</issue>
          <fpage>326</fpage>
          <pub-id pub-id-type="doi">10.1001/jama.2020.12646</pub-id>
          <pub-id pub-id-type="medline">32720992</pub-id>
          <pub-id pub-id-type="pii">2768786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Moffitt</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hajagos</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Amor</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Anand</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bissell</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Bradwell</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Bremer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Byrd</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Denham</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>DeWitt</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Gabriel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Garibaldi</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Girvin</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Guinney</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Jimenez</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kavuluru</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kostka</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lehmann</surname>
              <given-names>HP</given-names>
            </name>
            <name name-style="western">
              <surname>Levitt</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mallipattu</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Manna</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McMurry</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Morris</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Muschelli</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Palchuk</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Pfaff</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Qureshi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Spratt</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Walden</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Wooldridge</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>YJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>XT</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Austin</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Gersing</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Haendel</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>The National COVID Cohort Collaborative: Clinical Characterization and Early Severity Prediction</article-title>
          <source>medRxiv.</source>
          <comment>Preprint posted online January 23, 2021
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1101/2021.01.12.21249511"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2021.01.12.21249511</pub-id>
          <pub-id pub-id-type="medline">33469592</pub-id>
          <pub-id pub-id-type="pmcid">PMC7814838</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grannis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McAndrews</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Broyles</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Mikels-Carrasco</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wiensch</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Tachinardi</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Embi</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Leveraging Data Visualization and a Statewide Health Information Exchange to Support COVID-19 Surveillance and Response: Application of Public Health Informatics</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <month>01</month>
          <day>22</day>
          <fpage>ocab004</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33480419"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocab004</pub-id>
          <pub-id pub-id-type="medline">33480419</pub-id>
          <pub-id pub-id-type="pii">6106131</pub-id>
          <pub-id pub-id-type="pmcid">PMC7928924</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>An interactive web-based dashboard to track COVID-19 in real time</article-title>
          <source>Lancet Infect Dis</source>
          <year>2020</year>
          <month>05</month>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>533</fpage>
          <lpage>534</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32087114"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="medline">32087114</pub-id>
          <pub-id pub-id-type="pii">S1473-3099(20)30120-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7159018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jewell</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Lewnard</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Jewell</surname>
              <given-names>BL</given-names>
            </name>
          </person-group>
          <article-title>Caution Warranted: Using the Institute for Health Metrics and Evaluation Model for Predicting the Course of the COVID-19 Pandemic</article-title>
          <source>Ann Intern Med</source>
          <year>2020</year>
          <month>08</month>
          <day>04</day>
          <volume>173</volume>
          <issue>3</issue>
          <fpage>226</fpage>
          <lpage>227</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.acpjournals.org/doi/abs/10.7326/M20-1565?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.7326/M20-1565</pub-id>
          <pub-id pub-id-type="medline">32289150</pub-id>
          <pub-id pub-id-type="pii">2764774</pub-id>
          <pub-id pub-id-type="pmcid">PMC7197035</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Budd</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Lampos</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Zhuang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Edelstein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rees</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Emery</surname>
              <given-names>VC</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Keegan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Short</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Pillay</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Manley</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Cox</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Heymann</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>McKendry</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Digital technologies in the public-health response to COVID-19</article-title>
          <source>Nat Med</source>
          <year>2020</year>
          <month>08</month>
          <volume>26</volume>
          <issue>8</issue>
          <fpage>1183</fpage>
          <lpage>1192</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-020-1011-4</pub-id>
          <pub-id pub-id-type="medline">32770165</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-020-1011-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dagan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Barda</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kepten</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Miron</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Perchik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Hernán</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Lipsitch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Reis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Balicer</surname>
              <given-names>RD</given-names>
            </name>
          </person-group>
          <article-title>BNT162b2 mRNA Covid-19 Vaccine in a Nationwide Mass Vaccination Setting</article-title>
          <source>N Engl J Med</source>
          <year>2021</year>
          <month>04</month>
          <day>15</day>
          <volume>384</volume>
          <issue>15</issue>
          <fpage>1412</fpage>
          <lpage>1423</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33626250"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa2101765</pub-id>
          <pub-id pub-id-type="medline">33626250</pub-id>
          <pub-id pub-id-type="pmcid">PMC7944975</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Del Rio</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Malani</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 in 2021-Continuing Uncertainty</article-title>
          <source>JAMA</source>
          <year>2021</year>
          <month>04</month>
          <day>13</day>
          <volume>325</volume>
          <issue>14</issue>
          <fpage>1389</fpage>
          <lpage>1390</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2021.3760</pub-id>
          <pub-id pub-id-type="medline">33662092</pub-id>
          <pub-id pub-id-type="pii">2777391</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <article-title>COVID Data Tracker</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://covid.cdc.gov/covid-data-tracker/#datatracker-home">https://covid.cdc.gov/covid-data-tracker/#datatracker-home</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weissman</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Crane-Droesch</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chivers</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Luong</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hanish</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>MZ</given-names>
            </name>
            <name name-style="western">
              <surname>Lubken</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Becker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Draugelis</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Anesi</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Christie</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Hanson</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Mikkelsen</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Locally Informed Simulation to Predict Hospital Capacity Needs During the COVID-19 Pandemic</article-title>
          <source>Ann Intern Med</source>
          <year>2020</year>
          <month>07</month>
          <day>07</day>
          <volume>173</volume>
          <issue>1</issue>
          <fpage>21</fpage>
          <lpage>28</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.acpjournals.org/doi/abs/10.7326/M20-1260?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.7326/M20-1260</pub-id>
          <pub-id pub-id-type="medline">32259197</pub-id>
          <pub-id pub-id-type="pii">2764423</pub-id>
          <pub-id pub-id-type="pmcid">PMC7153364</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Identifying the outbreak signal of COVID-19 before the response of the traditional disease monitoring system</article-title>
          <source>PLoS Negl Trop Dis</source>
          <year>2020</year>
          <month>10</month>
          <volume>14</volume>
          <issue>10</issue>
          <fpage>e0008758</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pntd.0008758"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pntd.0008758</pub-id>
          <pub-id pub-id-type="medline">33001985</pub-id>
          <pub-id pub-id-type="pii">PNTD-D-20-00852</pub-id>
          <pub-id pub-id-type="pmcid">PMC7553315</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adnan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Newbern</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sherwood</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Potential Early Identification of a Large Campylobacter Outbreak Using Alternative Surveillance Data Sources: Autoregressive Modelling and Spatiotemporal Clustering</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <month>09</month>
          <day>17</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>e18281</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/3/e18281/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18281</pub-id>
          <pub-id pub-id-type="medline">32940617</pub-id>
          <pub-id pub-id-type="pii">v6i3e18281</pub-id>
          <pub-id pub-id-type="pmcid">PMC7530686</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shih</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Developing epidemic forecasting models to assist disease surveillance for influenza with electronic health records</article-title>
          <source>Int J Comput Appl</source>
          <year>2019</year>
          <month>08</month>
          <day>05</day>
          <volume>42</volume>
          <issue>6</issue>
          <fpage>616</fpage>
          <lpage>621</lpage>
          <pub-id pub-id-type="doi">10.1080/1206212x.2019.1633762</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kishore</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sondh</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Aggarwal</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kathirvel</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Google Search Trends Predicting Disease Outbreaks: An Analysis from India</article-title>
          <source>Healthc Inform Res</source>
          <year>2018</year>
          <month>10</month>
          <volume>24</volume>
          <issue>4</issue>
          <fpage>300</fpage>
          <lpage>308</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.e-hir.org/DOIx.php?id=10.4258/hir.2018.24.4.300"/>
          </comment>
          <pub-id pub-id-type="doi">10.4258/hir.2018.24.4.300</pub-id>
          <pub-id pub-id-type="medline">30443418</pub-id>
          <pub-id pub-id-type="pmcid">PMC6230529</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dexter</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Grannis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kasthurirathne</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Generalization of Machine Learning Approaches to Identify Notifiable Conditions from a Statewide Health Information Exchange</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2020</year>
          <volume>2020</volume>
          <fpage>152</fpage>
          <lpage>161</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32477634"/>
          </comment>
          <pub-id pub-id-type="medline">32477634</pub-id>
          <pub-id pub-id-type="pmcid">PMC7233074</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Romero</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Conejero</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Potential limitations in COVID-19 machine learning due to data source variability: A case study in the nCov2019 dataset</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <month>02</month>
          <day>15</day>
          <volume>28</volume>
          <issue>2</issue>
          <fpage>360</fpage>
          <lpage>364</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33027509"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa258</pub-id>
          <pub-id pub-id-type="medline">33027509</pub-id>
          <pub-id pub-id-type="pii">5919075</pub-id>
          <pub-id pub-id-type="pmcid">PMC7797735</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghorbani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Interpretation of Neural Networks Is Fragile</article-title>
          <source>AAAI</source>
          <year>2019</year>
          <month>07</month>
          <day>17</day>
          <volume>33</volume>
          <fpage>3681</fpage>
          <lpage>3688</lpage>
          <pub-id pub-id-type="doi">10.1609/aaai.v33i01.33013681</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vandekerckhove</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Matzke</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wagenmakers</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Model comparisonthe principle of parsimony</article-title>
          <source>The Oxford handbook of computationalmathematical psychology</source>
          <year>2015</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Oxford University Press</publisher-name>
          <fpage>300</fpage>
          <lpage>319</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <article-title>County Population Totals: 2010-2019</article-title>
          <source>United States Census Bureau</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/data/tables/time-series/demo/popest/2010s-counties-total.html">https://www.census.gov/data/tables/time-series/demo/popest/2010s-counties-total.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <article-title>State Reporting Assessments</article-title>
          <source>The COVID Tracking Project</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://covidtracking.com/about-data/state-reporting-assessments">https://covidtracking.com/about-data/state-reporting-assessments</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <article-title>MPH helps Indiana fight COVID-19 with data</article-title>
          <source>State of Indiana</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.in.gov/mph/1194.htm">https://www.in.gov/mph/1194.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ripley</surname>
              <given-names>BD</given-names>
            </name>
          </person-group>
          <article-title>The R Project in Statistical Computing</article-title>
          <source>MSOR Connections</source>
          <year>2001</year>
          <month>02</month>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>23</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.11120/msor.2001.01010023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maxmen</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Why the United States is having a coronavirus data crisis</article-title>
          <source>Nature</source>
          <year>2020</year>
          <month>09</month>
          <volume>585</volume>
          <issue>7823</issue>
          <fpage>13</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1038/d41586-020-02478-z</pub-id>
          <pub-id pub-id-type="medline">32843755</pub-id>
          <pub-id pub-id-type="pii">10.1038/d41586-020-02478-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoshida</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hara</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Global stability of a delayed SIR epidemic model with density dependent birth and death rates</article-title>
          <source>J Comput Appl Math</source>
          <year>2007</year>
          <month>04</month>
          <day>23</day>
          <volume>201</volume>
          <issue>2</issue>
          <fpage>339</fpage>
          <lpage>347</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1136/bmj.f4147.[published"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cam.2005.12.034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>DrugTherapeutics Bulletin</collab>
          </person-group>
          <article-title>An introduction to patient decision aids</article-title>
          <source>BMJ</source>
          <year>2013</year>
          <month>07</month>
          <day>23</day>
          <volume>347</volume>
          <fpage>f4147</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1136/bmj.f4147.[published"/>
          </comment>
          <pub-id pub-id-type="medline">23881944</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Giordano</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Blanchini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bruno</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Colaneri</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Di Filippo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Di Matteo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Colaneri</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Modelling the COVID-19 epidemic and implementation of population-wide interventions in Italy</article-title>
          <source>Nat Med</source>
          <year>2020</year>
          <month>06</month>
          <volume>26</volume>
          <issue>6</issue>
          <fpage>855</fpage>
          <lpage>860</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32322102"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41591-020-0883-7</pub-id>
          <pub-id pub-id-type="medline">32322102</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-020-0883-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7175834</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Musa</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A conceptual model for the coronavirus disease 2019 (COVID-19) outbreak in Wuhan, China with individual reaction and governmental action</article-title>
          <source>Int J Infect Dis</source>
          <year>2020</year>
          <month>04</month>
          <volume>93</volume>
          <fpage>211</fpage>
          <lpage>216</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1201-9712(20)30117-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijid.2020.02.058</pub-id>
          <pub-id pub-id-type="medline">32145465</pub-id>
          <pub-id pub-id-type="pii">S1201-9712(20)30117-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7102659</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Casella</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Can the COVID-19 epidemic be controlled on the basis of daily test reports? 2020</article-title>
          <source>Astrophysics Data System</source>
          <year>2020</year>
          <access-date>2020-03-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ui.adsabs.harvard.edu/abs/2020arXiv200306967C">https://ui.adsabs.harvard.edu/abs/2020arXiv200306967C</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19: Activity Level by Region and County</article-title>
          <source>Wisconsin Department of Health Services</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.dhs.wisconsin.gov/covid-19/disease.htm">https://www.dhs.wisconsin.gov/covid-19/disease.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dobbin</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Optimally splitting cases for training and testing high dimensional classifiers</article-title>
          <source>BMC Med Genomics</source>
          <year>2011</year>
          <month>04</month>
          <day>08</day>
          <volume>4</volume>
          <fpage>31</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedgenomics.biomedcentral.com/articles/10.1186/1755-8794-4-31"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1755-8794-4-31</pub-id>
          <pub-id pub-id-type="medline">21477282</pub-id>
          <pub-id pub-id-type="pii">1755-8794-4-31</pub-id>
          <pub-id pub-id-type="pmcid">PMC3090739</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Kaufman</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Ricketts</surname>
              <given-names>TC</given-names>
            </name>
          </person-group>
          <article-title>Defining urban and rural areas in U.S. epidemiologic studies</article-title>
          <source>J Urban Health</source>
          <year>2006</year>
          <month>03</month>
          <volume>83</volume>
          <issue>2</issue>
          <fpage>162</fpage>
          <lpage>175</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16736366"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11524-005-9016-3</pub-id>
          <pub-id pub-id-type="medline">16736366</pub-id>
          <pub-id pub-id-type="pmcid">PMC2527174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Learning from imbalanced data: open challenges and future directions</article-title>
          <source>Prog Artif Intell</source>
          <year>2016</year>
          <month>4</month>
          <day>22</day>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>221</fpage>
          <lpage>232</lpage>
          <pub-id pub-id-type="doi">10.1007/s13748-016-0094-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kasthurirathne</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Grannis</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Machine Learning Approaches to Identify Nicknames from A Statewide Health Information Exchange</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2019</year>
          <volume>2019</volume>
          <fpage>639</fpage>
          <lpage>647</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31259019"/>
          </comment>
          <pub-id pub-id-type="medline">31259019</pub-id>
          <pub-id pub-id-type="pmcid">PMC6568128</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khakharia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tiwari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Daphal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Warang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mehendale</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Outbreak Prediction of COVID-19 Patients for Dense and Populated Countries Using Machine Learning</article-title>
          <source>SSRN Journal</source>
          <year>2020</year>
          <pub-id pub-id-type="doi">10.2139/ssrn.3655759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maragakis</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Coronavirus Second Wave? Why Cases Increase</article-title>
          <source>Johns Hopkins Medicine</source>
          <access-date>2021-07-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hopkinsmedicine.org/health/conditions-and-diseases/coronavirus/first-and-second-waves-of-coronavirus">https://www.hopkinsmedicine.org/health/conditions-and-diseases/coronavirus/first-and-second-waves-of-coronavirus</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <article-title>Each State’s COVID-19 Reopening and Reclosing Plans and Mask Requirements</article-title>
          <source>National Academy for State Health Policy</source>
          <access-date>2021-02-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nashp.org/governors-prioritize-health-for-all/">https://www.nashp.org/governors-prioritize-health-for-all/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Molina</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Understanding transmission and intervention for the COVID-19 pandemic in the United States</article-title>
          <source>Sci Total Environ</source>
          <year>2020</year>
          <month>12</month>
          <day>15</day>
          <volume>748</volume>
          <fpage>141560</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32798884"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.scitotenv.2020.141560</pub-id>
          <pub-id pub-id-type="medline">32798884</pub-id>
          <pub-id pub-id-type="pii">S0048-9697(20)35089-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7413050</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lutz</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Huynh</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Schroeder</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Anyatonwu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dahlgren</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Danyluk</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Kipshidze</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mgbere</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>McHugh</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Siniscalchi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>West</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Johansson</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Biggerstaff</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Applying infectious disease forecasting to public health: a path forward using influenza forecasting examples</article-title>
          <source>BMC Public Health</source>
          <year>2019</year>
          <month>12</month>
          <day>10</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>1659</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-019-7966-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-019-7966-8</pub-id>
          <pub-id pub-id-type="medline">31823751</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-019-7966-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6902553</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
