<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i6e28253</article-id>
      <article-id pub-id-type="pmid">33900934</article-id>
      <article-id pub-id-type="doi">10.2196/28253</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Quantifying Online News Media Coverage of the COVID-19 Pandemic: Text Mining Study and Resource</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Basch</surname>
            <given-names>Corey</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Huang</surname>
            <given-names>Jian</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chen</surname>
            <given-names>Bin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Krawczyk</surname>
            <given-names>Konrad</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Mathematics and Computer Science</institution>
            <institution>University of Southern Denmark</institution>
            <addr-line>Campusvej 55</addr-line>
            <addr-line>Odense, DK-5230</addr-line>
            <country>Denmark</country>
            <phone>45 6550 2387</phone>
            <email>konradk@imada.sdu.dk</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2012-0803</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Chelkowski</surname>
            <given-names>Tadeusz</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0297-3650</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Laydon</surname>
            <given-names>Daniel J</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4270-3321</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Mishra</surname>
            <given-names>Swapnil</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8759-5902</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Xifara</surname>
            <given-names>Denise</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5529-8033</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Gibert</surname>
            <given-names>Benjamin</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8457-3137</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Flaxman</surname>
            <given-names>Seth</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2477-4217</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Mellan</surname>
            <given-names>Thomas</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4185-9930</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Schwämmle</surname>
            <given-names>Veit</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9708-6722</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Röttger</surname>
            <given-names>Richard</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4490-5947</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Hadsund</surname>
            <given-names>Johannes T</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1185-6694</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Bhatt</surname>
            <given-names>Samir</given-names>
          </name>
          <degrees>DPhil</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0891-4611</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Mathematics and Computer Science</institution>
        <institution>University of Southern Denmark</institution>
        <addr-line>Odense</addr-line>
        <country>Denmark</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Management in the Network Society</institution>
        <institution>Kozminski University</institution>
        <addr-line>Warsaw</addr-line>
        <country>Poland</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Infectious Disease Epidemiology</institution>
        <institution>MRC Centre for Global Infectious Disease Analysis</institution>
        <institution>Imperial College London</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Nupinion</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Mathematics</institution>
        <institution>Imperial College London</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Biochemistry and Molecular Biology</institution>
        <institution>University of Southern Denmark</institution>
        <addr-line>Odense</addr-line>
        <country>Denmark</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Section of Epidemiology</institution>
        <institution>Department of Public Health</institution>
        <institution>University of Copenhagen</institution>
        <addr-line>Copenhagen</addr-line>
        <country>Denmark</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Konrad Krawczyk <email>konradk@imada.sdu.dk</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>6</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>2</day>
        <month>6</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>6</issue>
      <elocation-id>e28253</elocation-id>
      <history>
        <date date-type="received">
          <day>28</day>
          <month>2</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>1</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>4</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>18</day>
          <month>4</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Konrad Krawczyk, Tadeusz Chelkowski, Daniel J Laydon, Swapnil Mishra, Denise Xifara, Benjamin Gibert, Seth Flaxman, Thomas Mellan, Veit Schwämmle, Richard Röttger, Johannes T Hadsund, Samir Bhatt. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 02.06.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/6/e28253" xlink:type="simple"/>
      <related-article related-article-type="correction-forward" xlink:title="This is a corrected version. See correction statement in:" xlink:href="https://www.jmir.org/2021/7/e31544/" vol="23" page="e31544"> </related-article>

      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Before the advent of an effective vaccine, nonpharmaceutical interventions, such as mask-wearing, social distancing, and lockdowns, have been the primary measures to combat the COVID-19 pandemic. Such measures are highly effective when there is high population-wide adherence, which requires information on current risks posed by the pandemic alongside a clear exposition of the rules and guidelines in place.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Here we analyzed online news media coverage of COVID-19. We quantified the total volume of COVID-19 articles, their sentiment polarization, and leading subtopics to act as a reference to inform future communication strategies.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We collected 26 million news articles from the front pages of 172 major online news sources in 11 countries (available online at SciRide). Using topic detection, we identified COVID-19–related content to quantify the proportion of total coverage the pandemic received in 2020. The sentiment analysis tool Vader was employed to stratify the emotional polarity of COVID-19 reporting. Further topic detection and sentiment analysis was performed on COVID-19 coverage to reveal the leading themes in pandemic reporting and their respective emotional polarizations.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We found that COVID-19 coverage accounted for approximately 25.3% of all front-page online news articles between January and October 2020. Sentiment analysis of English-language sources revealed that overall COVID-19 coverage was not exclusively negatively polarized, suggesting wide heterogeneous reporting of the pandemic. Within this heterogenous coverage, 16% of COVID-19 news articles (or 4% of all English-language articles) can be classified as highly negatively polarized, citing issues such as death, fear, or crisis.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The goal of COVID-19 public health communication is to increase understanding of distancing rules and to maximize the impact of governmental policy. The extent to which the quantity and quality of information from different communication channels (eg, social media, government pages, and news) influence public understanding of public health measures remains to be established. Here we conclude that a quarter of all reporting in 2020 covered COVID-19, which is indicative of information overload. In this capacity, our data and analysis form a quantitative basis for informing health communication strategies along traditional news media channels to minimize the risks of COVID-19 while vaccination is rolled out.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>text mining</kwd>
        <kwd>COVID-19</kwd>
        <kwd>infoveillance</kwd>
        <kwd>sentiment analysis</kwd>
        <kwd>public health</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The emergence of the novel coronavirus SARS-CoV-2 and the resultant disease COVID-19 has resulted in an estimated 2.4 million deaths [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Due to the initial lack of pharmaceutical measures targeting COVID-19, many governments resorted to nonpharmaceutical interventions (NPIs) to control the spread of the pandemic [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. The introduction of NPIs, such as social distancing, mask-wearing, or so-called <italic>lockdowns</italic>, significantly reduced SARS-CoV-2 transmission [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Therefore, in the absence of effective treatments or widespread rollout of vaccines, NPIs remain an important tool in COVID-19 control [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>The effectiveness of NPIs is dependent on population-wide adherence to government mandates (eg, social distancing rules, stay-at-home orders, and mask-wearing). Adherence, in turn, is dependent on society’s perception of such measures [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], which are shaped by print and digital media. Since adherence to NPIs is linked to public understanding of the guidelines, it is crucial for news sources shaping such knowledge to effectively expound the rules to maximize public response. As evidence accumulates, it is expected that guidelines will shift and be clarified. In the digital age, one of the primary information sources for society is online news [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Effective communication on the current state of the pandemic and prevention guidelines affects how society adheres to and responds to NPIs and, therefore, influences the severity of the pandemic.</p>
      <p>News articles have been previously shown to be an effective way of tracking disease outbreaks, with services such as HealthMap contributing to detecting and tracking disease outbreaks [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Even if only by virtue of its unprecedented scale, news media has been particularly important in the COVID-19 pandemic [<xref ref-type="bibr" rid="ref15">15</xref>]. There have been an estimated 38 million English-language articles on COVID-19 [<xref ref-type="bibr" rid="ref16">16</xref>]. It has further been demonstrated that misinformation on COVID-19 has been widespread and influential, both on social media [<xref ref-type="bibr" rid="ref17">17</xref>] and in traditional news sources [<xref ref-type="bibr" rid="ref16">16</xref>]. This can lead to an overload of information that hinders societal response to the pandemic [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
      <p>A particular difficulty of the pandemic is its emotional toll, both from the disease itself and from social distancing measures [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. Emotional toll can be investigated quantitatively by sentiment analysis, which calculates emotional polarization of text from negative, through neutral, to positive. Three previous studies have attempted to quantify emotional toll using sentiment analysis of social media conversations on COVID-19 [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. Counterintuitively, given pandemic subject matter, all three studies of sentiments from COVID-19 conversations on social media showed a higher proportion of positive rather than negative emotions. In contrast, analysis of COVID-19 headlines from 25 English news media sources indicated that 52% of them evoked negative emotions, 30% evoked positive emotions, and 18% evoked neutral emotions [<xref ref-type="bibr" rid="ref25">25</xref>]. News media can shape behavior toward the pandemic and adherence to control measures. Therefore, extensive negative coverage or contradictory information (ie, information overload) could have detrimental effects to both the mental health of individuals and how effectively society responds to control measures [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      <p>An earlier study on COVID-19 news coverage by Evanega et al [<xref ref-type="bibr" rid="ref16">16</xref>] sourced 38 million English-language COVID-19 articles by keyword search from LexisNexis, which indexes 7 million sources. Quantifying the extent of COVID-19 information requires normalizing the absolute number of articles with respect to the number of contributing sources. Likewise, sentiment of COVID-19 coverage also needs to be analyzed in the context of overall negativity of consumed information. Aslam et al [<xref ref-type="bibr" rid="ref25">25</xref>] analyzed 141,208 COVID-19 headlines, showing that 52% carried negative sentiment. Similar results were reported by Chakraborty and Bose, who collected COVID-19 news articles from GDELT (Global Database of Events, Language, and Tone) and found that pandemic coverage was mostly associated with negative sentiment polarization [<xref ref-type="bibr" rid="ref27">27</xref>]. Though informative, these studies did not contrast COVID-19 sentiment distribution with the sentiment distribution of the sources they originated from. By contextualizing the sentiment distribution of pandemic reporting within that of the overall coverage, it is possible to draw meaningful conclusions on whether the amount of COVID-19 information is indeed more negatively polarized than what news media consumers are exposed to.</p>
      <p>To address the above issues, we collected over 26 million articles from the front pages of 172 major online news sources from 11 countries and compiled these into a reusable database available at SciRide [<xref ref-type="bibr" rid="ref28">28</xref>]. Firstly, we investigated trends in COVID-19 news with respect to all articles that appeared on the front pages in 2020. Secondly, we analyzed whether articles on COVID-19 were more sentiment-polarized compared with other articles. Finally, we analyzed the leading subtopics in COVID-19 coverage and assessed their sentiment polarization. Overall, our work aimed to elucidate the volume and content of news coverage of COVID-19 in traditional media as a basis for data-driven discussion regarding policy communication in the pandemic.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Curation of a Database of Front-Page News Articles</title>
        <p>To assess coverage of COVID-19 and the sentiment it evoked, we analyzed the landing pages from major online news sources in countries with robust media presence. We selected the major online news sources from 11 countries: the United States, the United Kingdom, Canada, Australia, New Zealand, Ireland, Germany, France, Italy, Spain, and Russia. We included an additional <italic>international</italic> category to better reflect the global focus of certain online news sources.</p>
        <p>For each country, the major online news sources were identified by reference to profiles in BBC Media, which is an authority in curating global news source information and lists of news sites with the most traffic and is curated by SimilarWeb. Focusing on major national online news sources, as defined by online visibility, captures some of the main sources in shaping societal knowledge and opinions [<xref ref-type="bibr" rid="ref29">29</xref>]. It should be noted that the focus on online news sources excludes the impact of social media, epistemic communities, and other influences on public perception. However, due to their depth of penetration, political heterogeneity, and reliability, major online news sources provide an excellent proxy of overall public perception.</p>
        <p>For each online news source, we collected the archived front-page snapshots dating back to 2015 via Internet Archive [<xref ref-type="bibr" rid="ref30">30</xref>], cutting off coverage in 2020 at October 15. We used the pre-2020 articles to fine-tune the accuracy of article collection and provide statistics on reporting of certain topics pre–COVID-19. Each front page was sourced for potential news items using a custom-based pipeline we developed (Section 1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). We defined each article as the combination of the metadata elements title and description—sometimes referred to as headline and subheading—that are broadly akin to titles and abstracts in scientific publications [<xref ref-type="bibr" rid="ref31">31</xref>]. Such metadata are reasonably standardized among online news sources and they offer a headline-like summary of the article, typically designed for sharing on social media, making them suitable for topic detection and sentiment analysis. In total, we collected 26,077,939 articles from front pages of 172 online news sources (<xref ref-type="table" rid="table1">Table 1</xref>), with the full list of contributing sources in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>Contemporary news sites rapidly change their content, which is spread through multiple sections, so it is difficult to gauge the level of attention received by particular articles. Front pages of news sites should be reliable reflections of the information many users are exposed to, since they are the main points of entry. This is opposed to other article collection strategies, such as RSS (Really Simple Syndication) or downloading the entire website content, that can provide limited control over assessing how many people have actually read any given article [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Focusing our efforts on articles from landing pages of major online news sources enabled us to assess the number of COVID-19–related articles that a large proportion of online news consumers were exposed to.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Number of online news sources and collected articles per country.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="350"/>
            <col width="350"/>
            <thead>
              <tr valign="top">
                <td>Country</td>
                <td>Online news sources (N=172), n (%)</td>
                <td>Collected articles (N=26,077,939), n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Canada</td>
                <td>13 (7.5)</td>
                <td>1,269,200 (4.8)</td>
              </tr>
              <tr valign="top">
                <td>Australia</td>
                <td>8 (4.6)</td>
                <td>1,124,859 (4.3)</td>
              </tr>
              <tr valign="top">
                <td>Italy</td>
                <td>13 (7.5)</td>
                <td>1,526,521 (5.8)</td>
              </tr>
              <tr valign="top">
                <td>The United Kingdom</td>
                <td>21 (12.2)</td>
                <td>4,977,792 (19.0)</td>
              </tr>
              <tr valign="top">
                <td>The United States</td>
                <td>33 (19.1)</td>
                <td>4,388,383 (16.8)</td>
              </tr>
              <tr valign="top">
                <td>France</td>
                <td>9 (5.2)</td>
                <td>1,951,608 (7.4)</td>
              </tr>
              <tr valign="top">
                <td>Germany</td>
                <td>18 (10.4)</td>
                <td>2,348,403 (9.0)</td>
              </tr>
              <tr valign="top">
                <td>Ireland</td>
                <td>8 (4.6)</td>
                <td>905,598 (3.4)</td>
              </tr>
              <tr valign="top">
                <td>International</td>
                <td>6 (3.4)</td>
                <td>462,989 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>New Zealand</td>
                <td>5 (2.9)</td>
                <td>651,050 (2.4)</td>
              </tr>
              <tr valign="top">
                <td>Russia</td>
                <td>19 (11.0)</td>
                <td>3,348,825 (12.8)</td>
              </tr>
              <tr valign="top">
                <td>Spain</td>
                <td>19 (11.0)</td>
                <td>3,122,711 (11.9)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Topic Models</title>
        <p>For each article we extracted, we analyzed the text content of the metadata title and description to determine whether the article could be associated with one of the following topics: cat, sport, Merkel, Putin, Johnson, Biden, Trump, cancer, climate, or COVID-19. Non–COVID-19 topics were selected to provide a reference with large expected volumes of coverage (ie, politicians) that cover a wide range of sentiments (еg, <italic>cat</italic> as nonnegative and <italic>cancer</italic> as negative). Each topic was identified on the basis of the keywords presented in <xref ref-type="table" rid="table2">Table 2</xref>. The only normalization we applied to the words for topic identification was case folding, otherwise the words were not stemmed nor lemmatized. Topics that were used solely for sentiment analysis—cat, sport, climate, and cancer—were not identified for non-English online news sources.</p>
        <p>We chose keywords for each topic in order to maximize the precision of topic identification. Because we focused on titles and descriptions, mentions of specific keywords here made it unlikely that they were only tangentially relevant to the article at hand (eg, explicit mentions of politicians’ names). In the case of COVID-19, we tested the extent to which our topic detection misclassified the topic by identifying COVID-19 articles in the pre–COVID-19 era of 2015 to 2019. Out of 21,693,591 articles, only 7375 (0.03%) were erroneously identified as related to COVID-19, demonstrating high precision of the selected keywords. In the majority of cases, misclassifications stemmed from mentions of lockdowns, which were chiefly gun related, but in the case of the United Kingdom, they were even related to a seagull attack on a school. Subsequent subtopic identification stratified the different threads of COVID-19 coverage, providing a wider set of keywords.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Keywords employed for topic detection.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="110"/>
            <col width="180"/>
            <col width="140"/>
            <col width="140"/>
            <col width="140"/>
            <col width="140"/>
            <col width="150"/>
            <col width="0"/>
            <col width="0"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td colspan="7">Keywords by language</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>English</td>
                <td>German</td>
                <td>French</td>
                <td>Spanish</td>
                <td>Italian</td>
                <td>Russian</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>
                  <bold>COVID-19</bold>
                </td>
                <td colspan="7">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>coronavirus</td>
                <td>coronavirus</td>
                <td>coronavirus</td>
                <td>coronavirus</td>
                <td>coronavirus</td>
                <td>коронавирус</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>covid</td>
                <td>covid</td>
                <td>covid</td>
                <td>covid</td>
                <td>covid</td>
                <td>covid<break/>ковид</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>lockdown</td>
                <td>lockdown</td>
                <td>lockdown<break/>couvre-feu</td>
                <td>lockdown<break/>confinamiento</td>
                <td>lockdown<break/>contenimento</td>
                <td>lockdown<break/>локдаун</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>quarantine</td>
                <td>quarantäne</td>
                <td>quarantaine</td>
                <td>cuarantena</td>
                <td>quarantena</td>
                <td>карантин</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>pandemic</td>
                <td>pandemie</td>
                <td>pandémie</td>
                <td>pandemia</td>
                <td>pandemia</td>
                <td>пандемиа</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N/A<sup>a</sup></td>
                <td>corona-</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Merkel</td>
                <td>merkel</td>
                <td>merkel</td>
                <td>merkel</td>
                <td>merkel</td>
                <td>merkel</td>
                <td>merkel<break/>меркел</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Trump</td>
                <td>trump</td>
                <td>trump</td>
                <td>trump</td>
                <td>trump</td>
                <td>trump</td>
                <td>trump<break/>трамп</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Biden</td>
                <td>biden</td>
                <td>biden</td>
                <td>biden</td>
                <td>biden</td>
                <td>biden</td>
                <td>biden<break/>байден</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Johnson</td>
                <td>boris johnson</td>
                <td>boris johnson</td>
                <td>boris johnson</td>
                <td>boris johnson</td>
                <td>boris johnson</td>
                <td>boris johnson<break/>борис джонсон</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Putin</td>
                <td>putin</td>
                <td>putin</td>
                <td>putin</td>
                <td>putin</td>
                <td>putin</td>
                <td>putin<break/>путин</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <bold>Climate</bold>
                </td>
                <td colspan="8">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>global warming</td>
                <td>—<sup>b</sup></td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>climate change</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>climate crisis</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <bold>Cat</bold>
                </td>
                <td colspan="8">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>cat</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>kitten</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <bold>Sport</bold>
                </td>
                <td colspan="8">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>baseball</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>major league</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>champion's league</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>football</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>nfl</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>premier league</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>basketball</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>soccer</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>nba</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Cancer</td>
                <td>cancer</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>N/A: not applicable; this keyword, which is specific to the German language because of its compound nature, was only found in German news sources.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>The topics <italic>climate</italic>, <italic>cat</italic>, <italic>sport</italic>, and <italic>cancer</italic> were not identified in non–English-language online news sources, as these were solely employed for sentiment analysis.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>We further identified subtopics within COVID-19 news coverage by a similar keyword-based approach. Since many subtopic words can have several forms (eg, dead, died, and dies), we stemmed the words associated with each subtopic (eg, healthy and healthier are both stemmed to health); these are presented in <xref ref-type="table" rid="table3">Table 3</xref>. An article was identified as pertaining to a subtopic if, after stemming its title and description, a token corresponding to a stemmed keyword in <xref ref-type="table" rid="table3">Table 3</xref> was identified.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>COVID-19 news subtopics.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="390"/>
            <col width="610"/>
            <thead>
              <tr valign="bottom">
                <td>Subtopic<sup>a</sup></td>
                <td>Stemmed keywords</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Case</td>
                <td>case</td>
              </tr>
              <tr valign="top">
                <td>Crisis</td>
                <td>crisi</td>
              </tr>
              <tr valign="top">
                <td>Death</td>
                <td>die, death</td>
              </tr>
              <tr valign="top">
                <td>Disease</td>
                <td>diseas</td>
              </tr>
              <tr valign="top">
                <td>Distancing</td>
                <td>distanc</td>
              </tr>
              <tr valign="top">
                <td>Fear</td>
                <td>fear</td>
              </tr>
              <tr valign="top">
                <td>Health</td>
                <td>health</td>
              </tr>
              <tr valign="top">
                <td>Home</td>
                <td>home</td>
              </tr>
              <tr valign="top">
                <td>Hospital</td>
                <td>hospit</td>
              </tr>
              <tr valign="top">
                <td>Infection</td>
                <td>infect</td>
              </tr>
              <tr valign="top">
                <td>Isolation</td>
                <td>isol</td>
              </tr>
              <tr valign="top">
                <td>Lockdown</td>
                <td>lockdown</td>
              </tr>
              <tr valign="top">
                <td>Mask</td>
                <td>mask</td>
              </tr>
              <tr valign="top">
                <td>Outbreak</td>
                <td>outbreak</td>
              </tr>
              <tr valign="top">
                <td>Quarantine</td>
                <td>quarantin</td>
              </tr>
              <tr valign="top">
                <td>Spread</td>
                <td>spread</td>
              </tr>
              <tr valign="top">
                <td>Symptom</td>
                <td>symptom</td>
              </tr>
              <tr valign="top">
                <td>Test</td>
                <td>test</td>
              </tr>
              <tr valign="top">
                <td>Treatment</td>
                <td>treatment</td>
              </tr>
              <tr valign="top">
                <td>Vaccine</td>
                <td>vaccin</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Each of the subtopics was identified by the stemmed keywords (ie, stemming).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Sentiment Analysis of News Articles Using Vader</title>
        <p>We used a well-established sentiment analysis tool, Vader [<xref ref-type="bibr" rid="ref33">33</xref>], to identify emotionally polarized content, which has previously been applied to news media. It is suitable for short snippets of text, such as the titles and descriptions in our metadata. For a given piece of text, Vader provides a compound score between –1 and 1, with –1 being entirely negative, 0 being neutral, and 1 being entirely positive. For instance, the phrase “I find your lack of faith disturbing” offers a Vader score of –0.42, whereas the phrase “I find your lack of faith encouraging” gives a score of 0.5994. In our case, a sentiment score for a single article consists of a Vader compound score for the concatenation of the article title and description.</p>
        <p>Novel topics are associated with many subject-specific keywords and phrases (eg “social distancing” and “lockdown” for COVID-19). Applying sentiment analysis to text with novel keywords can result in software being unable to correctly annotate polarization. We assessed Vader sentiment annotations on articles identified as one of the subtopics in <xref ref-type="table" rid="table3">Table 3</xref>. This revealed an artifact of the tool, wherein “positive coronavirus test” was labeled as emotionally polarized in the positive direction by virtue of the word “positive.” In order to mitigate the effect of this subject-specific misclassification, the words “positive” and “negative,” for symmetry, were removed from articles related to coronavirus testing prior to applying Vader annotation.</p>
      </sec>
      <sec>
        <title>Estimating Topic Polarization: Relative Sentiment Skew</title>
        <p>We examined whether coverage of a given topic was more emotionally polarized than another topic by contrasting their sentiment distributions. Directly comparing topic sentiment distributions between different online news sources is not sound. Different online news sources can be more sensational and negative or toned-down and neutral, which gives radically different sentiment distributions. To address this issue, we calculated whether specific topic coverage was more negative, positive, or neutral relative to other articles within a particular online news source.</p>
        <p>For each article “<italic>a</italic>” (ie, that article’s title and description metadata) in English-language online news sources, we calculated the Vader compound sentiment score <italic>sent(a)</italic>. For all 2020 articles and topics, in a given online news source, we calculated the mean of the Vader compound sentiment scores, denoted as <italic>μ<sub>ONS,TOPIC</sub></italic> (online news source [ONS]; equation 1). As a reference statistic for the distribution of sentiment scores not relating to a topic, we calculated the mean Vader score of the articles from a given online news source that were not identified as a given topic, denoted as <italic>μ<sub>ONS,TOPIC</sub></italic> (equation 2):</p>
        <graphic xlink:href="jmir_v23i6e28253_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        <graphic xlink:href="jmir_v23i6e28253_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        <p>where <italic>ONS</italic> is a particular online news source, <italic>TOPIC</italic> is a topic from <xref ref-type="table" rid="table2">Table 2</xref> or <xref ref-type="table" rid="table3">Table 3</xref>, <italic>ONS(TOPIC)</italic> is the set of articles on a given topic from a particular online news source, and |<italic>ONS<sub>TOPIC</sub></italic>| is the total number of articles on a given topic in that online news source. A set of articles not identified as a given topic from a particular online news source is denoted as <italic>ONS<sub>TOPIC</sub></italic>.</p>
        <p>For each topic in each online news source, we calculated the relative sentiment skew (<italic>rsskew<sub>ONS,TOPIC</sub></italic>) between topic mean sentiment and the mean of all other articles in the given online news source (equation 3).</p>
        <graphic xlink:href="jmir_v23i6e28253_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        <p>Relative sentiment skew is designed to indicate whether the sentiment score distribution of a particular topic is negatively or positively polarized, compared to other articles, for example, where a topic has one positive (score +1) and two negative articles (each with score −1), and there are seven other nontopic articles that are all positive (each with score +1). In this instance, the relative sentiment skew metric <italic>rsskew<sub>ONS,TOPIC</sub></italic> is –1/3 – 7/7 = –1.33, which indicates greater negativity. Note, we do not account for sample size variation, as the denominator is generally very large (ie, in the thousands).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>One-Quarter of 2020 News Coverage Was Pandemic Related, Suggesting Information Overload</title>
        <p>We estimated the extent of COVID-19 coverage in online news media by identifying articles relating to the pandemic and comparing this number to the total number of articles between January and October 2020.</p>
        <p>For each online news source, we performed topic detection, categorizing each article title and description as relating to the coronavirus—topic called COVID-19—if the title and description contained any keyword of a specific set, given in <xref ref-type="table" rid="table2">Table 2</xref>. Keywords for this simplified topic detection model were chosen to maximize the precision and accuracy of content identification in order to avoid cross-contamination with other topics. In English, these keywords included <italic>covid</italic>, <italic>coronavirus</italic>, <italic>lockdown</italic>, <italic>quarantine</italic>, and <italic>pandemic</italic>, but not, for example, <italic>hospital</italic> and <italic>death</italic>. The keywords were adjusted for the six languages that we used in this study: English, German, French, Spanish, Italian, and Russian (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
        <p>COVID-19 featured in 25.3% of the news articles (1,135,561/4,477,867) across the online news sources (<xref rid="figure1" ref-type="fig">Figure 1</xref>). While this proportion varied between countries, it was consistently large, with the lower bound at 20% and the upper bound at 30%. Thus, even using our relatively simple topic detection model, we were able to demonstrate that 2020 online news coverage was dominated by COVID-19.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The extent of coronavirus coverage in 2020. We calculated the proportion of all COVID-19 articles as the proportion of all front-page articles. Proportions were calculated for each online news source separately and then aggregated at the national level. The green points represent the individual coverage of each online news source. The yellow line in each box represents the median; the upper and lower whiskers represent the 75th and 25th percentiles, respectively. The red dotted line indicates mean proportion across all online news sources.</p>
          </caption>
          <graphic xlink:href="jmir_v23i6e28253_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>To provide a point of reference to coverage of COVID-19, we identified other global topics with regular and topical media presence (<xref ref-type="table" rid="table2">Table 2</xref>). We selected topics such as Donald Trump (Trump), Joe Biden (Biden), Boris Johnson (Johnson), Angela Merkel (Merkel), and Vladimir Putin (Putin). Unsurprisingly, mentions of politicians are most common in their home countries (Figures S1-S5 in Section 2 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) (eg, Vladimir Putin in Russia). Nonetheless, each politician received an order of magnitude less media attention than COVID-19 in 2020. Specifically, mean coverage of COVID-19 across 11 countries was 25.66%, whereas politicians received 2.50% for Trump, 0.45% for Biden, 0.18% for Putin, 0.17% for Johnson, and 0.09% for Merkel. Higher coverage of COVID-19 was also reflected at the national level. Although 2020 was an election year in the United States, <italic>Trump</italic> received a mean of 15.29% of 2020 media mentions in US online news sources, as opposed to 25.91% of mean mentions for COVID-19. Furthermore, US articles in 2020 mentioning both Trump and COVID-19 accounted for a mean coverage of 3.82%.</p>
        <p>To provide temporal perspective on the media attention of COVID-19, we plotted the proportions of global coverage in the period from January to October 2020 (Figure S6 in Section 2 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). COVID-19 attention in 2020 spiked between March and May, coinciding with many countries following the Chinese strategy of lockdown and other distancing measures. Proportion coverage leading up to the second COVID-19 wave in Europe and the United States did not reach levels seen from March to May but did stay above 20% in the regions we considered. These results provide a quantification of the extent of media attention received by COVID-19 across countries and languages, reflecting the global and protracted impact of the pandemic.</p>
      </sec>
      <sec>
        <title>COVID-19 News Sentiment Analysis Suggests Heterogeneity of Coverage</title>
        <p>The emotion that news coverage of COVID-19 evokes is an important factor in a society’s response to the pandemic [<xref ref-type="bibr" rid="ref25">25</xref>]. We addressed this issue by sentiment analysis contrasting emotional polarization of COVID-19 news with that of certain reference topics and all non–COVID-19 articles for each online news source. Such contrast allows us to determine whether sentiment distribution of COVID-19 coverage was polarized compared to reference topics and other online news for a given online news source.</p>
        <p>To quantify the emotional content of news article text, we employed Vader, which has been previously applied to news article analysis [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>] (see Methods section). For each online news source whose primary language was English (91/172, 52.9%), we created Vader annotations for both the title and description of each of its articles. We grouped articles by their annotated topics (<xref ref-type="table" rid="table2">Table 2</xref>) to provide a comparison with COVID-19 sentiments. Politicians—Merkel, Trump, Johnson, Biden, and Putin—were used as reference points for subjects with frequent coverage. We selected four additional topics to offer intuitive reference points on the positive and negative sentiment spectrum: cat, sport, climate, and cancer. The topics <italic>cat</italic> and <italic>sport</italic> were used, as they would not necessarily be associated with negative sentiments. Likewise, the topics of <italic>climate</italic>—identified by the key phrases global warming, climate crisis, and climate change—and <italic>cancer</italic> were used as references that we would expect to be associated with negative emotions. Altogether, individual sentiment annotations for each online news source were grouped by one of the topics: cat, sport, Merkel, Johnson, Biden, Trump, COVID-19, and cancer.</p>
        <p>For each online news source and topic, we calculated the relative sentiment skew statistic (<italic>rsskew<sub>ONS,TOPIC</sub></italic>; see Methods section), which measures the polarization of a given topic within an online news source. We noted how many topics had a negative or positive relative sentiment skew value (<xref ref-type="table" rid="table4">Table 4</xref>). For the nonpolitician non–COVID-19 topics (ie, cat, sport, and cancer), skew was in the expected direction, suggesting that they are appropriate references for assessing sentiment of COVID-19 articles. We noted negative relative sentiment skew values for 74 out of 91 (81%) English-language online news sources. Nonetheless, this observation cannot be taken as evidence of significant negative polarization, as these relative sentiment skew values are not substantially different than <italic>rsskew</italic>=0, which indicates no polarization. The mean relative sentiment skew for COVID was –0.04 (SD 0.07) (<xref ref-type="table" rid="table4">Table 4</xref>). Since cancer and COVID-19 are both diseases and exert a large burden on public health, one might expect their sentiment distributions from online news to be similar. However, COVID-19 sentiment distribution was not as extreme as that of cancer, which was 100% negative per online news source, and had a mean relative sentiment skew of –0.53 (SD 0.12). Perhaps surprisingly, the sentiment distribution for COVID-19 articles was more akin to coverage of climate, which was <italic>a priori</italic> expected to be negative, akin to cancer, or to subjects covering heterogenous topics by virtue of their wide-ranging implications for society, such as politicians (<xref rid="figure2" ref-type="fig">Figure 2</xref>). This, however, can be an indicator of topics being intertwined: since heads of state are responsible for the pandemic response, they can be expected to be mentioned in relation to COVID-19.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>English-language online news sources<sup>a</sup>, with positive (≥0) or negative (&lt;0) relative sentiment skew of 2020 articles on a given topic.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="190"/>
            <col width="240"/>
            <col width="240"/>
            <col width="200"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Positive online news sources, n (%)</td>
                <td>Negative online news sources, n (%)</td>
                <td>Relative sentiment skew, mean (SD)</td>
                <td>Total articles<sup>b</sup>, n</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Cat (n=87)</td>
                <td>64 (74)</td>
                <td>23 (26)</td>
                <td>0.12 (0.23)</td>
                <td>2746</td>
              </tr>
              <tr valign="top">
                <td>Sport (N=91)</td>
                <td>84 (92)</td>
                <td>7 (8)</td>
                <td>0.12 (0.08)</td>
                <td>63,155</td>
              </tr>
              <tr valign="top">
                <td>Biden (n=90)</td>
                <td>75 (83)</td>
                <td>15 (17)</td>
                <td>0.09 (0.11)</td>
                <td>38,949</td>
              </tr>
              <tr valign="top">
                <td>Johnson (n=90)</td>
                <td>57 (63)</td>
                <td>33 (37)</td>
                <td>0.04 (0.17)</td>
                <td>22,613</td>
              </tr>
              <tr valign="top">
                <td>Merkel (n=79)</td>
                <td>38 (48)</td>
                <td>41 (52)</td>
                <td>–0.01 (0.25)</td>
                <td>2011</td>
              </tr>
              <tr valign="top">
                <td>COVID-19 (N=91)</td>
                <td>17 (19)</td>
                <td>74 (81)</td>
                <td>–0.04 (0.07)</td>
                <td>589,701</td>
              </tr>
              <tr valign="top">
                <td>Climate (N=91)</td>
                <td>38 (42)</td>
                <td>53 (58)</td>
                <td>–0.04 (0.11)</td>
                <td>7195</td>
              </tr>
              <tr valign="top">
                <td>Putin (n=88)</td>
                <td>33 (38)</td>
                <td>55 (63)</td>
                <td>–0.05 (0.23)</td>
                <td>5179</td>
              </tr>
              <tr valign="top">
                <td>Trump (N=91)</td>
                <td>24 (26)</td>
                <td>67 (74)</td>
                <td>–0.06 (0.09)</td>
                <td>157,702</td>
              </tr>
              <tr valign="top">
                <td>Cancer (N=91)</td>
                <td>0 (0)</td>
                <td>91 (100)</td>
                <td>–0.53 (0.12)</td>
                <td>9548</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>We had 91 English-language online news sources in total; however, in cases where it was impossible to identify a certain topic in a given source, it was left out.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>The total number of articles we identified as being associated with a given topic across all online news sources.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Relative sentiment skew (<italic>rrskew</italic>) of COVID-19 coverage. Each article title and description from each English-language online news source (ONS) received a Vader sentiment compound score between –1 and 1 (most negative and most positive, respectively). We noted the difference in mean sentiment for a specific topic and mean sentiment for other 2020 articles in a given online news source (<italic>rsskew<sub>ONS,TOPIC</sub></italic>; see Methods section). The density of the relative sentiment skew is plotted for each topic. Distributions are colored green if their relative sentiment skew was predominantly positive or red if predominantly  negative (<xref ref-type="table" rid="table4">Table 4</xref>). Intensity of the color is scaled by the distance from the red dotted line at 0, which indicates a lack of difference between topic sentiment and all other articles in a given online news source.</p>
          </caption>
          <graphic xlink:href="jmir_v23i6e28253_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>These results suggest that the sentiment of COVID-19 coverage in online news media is heterogeneous and is certainly not as clearly polarized as cancer, though the volume of coverage might play a role (Figure S7 in Section 3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). One explanation could be the all-permeating nature of the pandemic, where it becomes background to most reporting. Therefore, COVID-19 articles cannot all be categorized as fully negative, contrary to the expectation of pandemic subject matter. In fact, on average, they appear to not be polarized in either the positive or negative direction, especially when compared to reference topics. This suggests that coverage of COVID-19 was highly heterogeneous, with many themes contributing to the totality of messaging.</p>
      </sec>
      <sec>
        <title>Highly Sentiment-Negative Subtopics Account for 16% of COVID-19 Coverage, Suggesting Emotional Pressure</title>
        <p>We studied the text content of COVID-19–related title and description metadata to reveal the leading themes associated with heterogeneous pandemic reporting.</p>
        <p>We investigated article subtopics and calculated the most commonly used words and bigrams (ie, consecutive combinations of two words) to demonstrate the most frequent mentions in COVID-19 coverage. For each of the 91 English-language online news sources, we calculated the ranks of single words and bigrams in articles that pertained to COVID-19. The articles were further subdivided within each online news source as negative (Vader score &lt;–0.2; 247,542 articles), positive (Vader score &gt;0.2; 192,643 articles), or all (any Vader score; 589,709 articles). This subdivision aimed to reveal whether certain keywords or bigrams were more frequently associated with differently polarized text. For each subdivision, we averaged the individual online news source ranks of each word and bigram found across all 91 online news sources. In <xref ref-type="table" rid="table5">Table 5</xref> we present the top 20 highest-ranking words and bigrams across all 91 online news sources. Words and bigrams in <xref ref-type="table" rid="table5">Table 5</xref> reveal many themes that are intuitively associated with the coronavirus, such as testing, vaccine, death, etc. In particular, negative articles had unique top words and bigrams that are intuitively associated with negative emotions. In the singletons, these were <italic>death</italic>, <italic>crisi</italic>, and <italic>fear</italic>, while in bigrams these were <italic>covid_crisi</italic>, <italic>covid_death</italic>, <italic>coronavirus_death</italic>, and <italic>death_toll</italic>—note that words are stemmed.</p>
        <p>To calculate the news coverage proportion related to these top themes, we created a constrained set of COVID-19 subtopics, based on the highest-ranking words and bigrams from <xref ref-type="table" rid="table5">Table 5</xref>. We removed terms that pointed to nonspecific coronavirus coverage, such as <italic>COVID</italic>, <italic>coronavirus</italic>, <italic>pandemic</italic>, or <italic>news</italic>. We extended the list of subtopics to include those we did not find in <xref ref-type="table" rid="table5">Table 5</xref> but considered as strongly related to COVID-19 coverage, such as <italic>hospital</italic>, <italic>quarantine</italic>, <italic>symptom</italic>, or <italic>isolation</italic>, with a full list of subtopics in <xref ref-type="table" rid="table3">Table 3</xref>. For each subtopic, we calculated the proportion of COVID-19 coverage per online news source (Figure S8 in Section 4 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) and relative sentiment skew per online news source for the subtopic (Figure S9 in Section 4 of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The means of coverage and sentiments per online news source are plotted against each other in <xref rid="figure3" ref-type="fig">Figure 3</xref>. The subtopics in <xref ref-type="table" rid="table3">Table 3</xref> account for a mean of 67.14% of all COVID-19 articles across English-language online news sources. Of these, the top three are <italic>case</italic>, <italic>lockdown</italic>, and <italic>death</italic>, which account for a mean of 9.29%, 8.56%, and 8.08% of COVID-19 articles, respectively. <xref rid="figure3" ref-type="fig">Figure 3</xref> and Figure S9 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> suggest that out of <italic>case</italic>, <italic>death</italic>, and <italic>lockdown</italic>, only <italic>death</italic> carried a firmly polarized sentiment, with <italic>case</italic> and <italic>lockdown</italic> not being significantly skewed in either positive or negative directions. The words <italic>fear</italic>, <italic>crisis</italic>, and <italic>death</italic> unsurprisingly indicated substantial negative polarization (<xref rid="figure3" ref-type="fig">Figure 3</xref>).</p>
        <p>We analyzed the impact on news sentiment in 2020 of the three most negative subtopics, <italic>fear</italic>, <italic>crisis</italic>, and <italic>death</italic> (<xref rid="figure3" ref-type="fig">Figure 3</xref>). For each online news source, we calculated the mean sentiment of all the 2020 articles after removing articles that mentioned one of those three topics. For all 91 online news sources, removing articles mentioning one of the top three negative topics resulted in a statistically significant—at the level of .05 with Bonferroni correction—shift toward mean positive sentiment (Section 5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). By contrast, removal of all the sentiment-heterogeneous (<xref rid="figure2" ref-type="fig">Figure 2</xref>) articles from all 2020 articles resulted in a significant shift toward mean positive sentiment in 40 out of 91 (44%) online news sources, a significant shift toward mean negative sentiment for 11 out of 91 (12%) online news sources, and no statistically significant result for 39 out of 91 (43%) online news sources. Altogether, articles mentioning <italic>fear</italic>, <italic>crisis</italic>, and <italic>death</italic> accounted for a mean of 16% of COVID-19 articles across 91 online news sources; due to their highly polarizing nature, they may play a significant role in shaping societal perception of the pandemic.</p>
        <p>Of the three most negative topics, <italic>fear</italic>, <italic>crisis</italic>, or <italic>death</italic>, the latter was the most frequently mentioned for COVID-19 (<xref rid="figure3" ref-type="fig">Figure 3</xref>). In total, <italic>death</italic> was mentioned in the context of COVID-19 in 2.33% of all coverage in 91 English-language online news sources. All <italic>death</italic> mentions in 2020 in 91 English-language online news sources accounted for a mean coverage of 5.74%, whereas in the pre–COVID-19 period of 2015 to 2019, they accounted for 4.07%. Therefore, we can identify that <italic>death</italic> in the context of COVID-19 constituted a significant proportion of negatively associated coverage that appears to have contributed to overall death reporting in the news.</p>
        <p>These results demonstrate that even though the overall coverage of COVID-19 in 2020 was not significantly polarized by sentiment, there was a nontrivial proportion of negative news that contributed to overall reporting negativity in 2020.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Top words and bigrams in English-language countries.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="150"/>
            <col width="270"/>
            <col width="270"/>
            <col width="280"/>
            <col width="0"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Rank</td>
                <td colspan="4">Words and bigrams by polarization<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>Negative</td>
                <td>All</td>
                <td>Positive</td>
                <td>
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>Single words</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td>coronavirus</td>
                <td>coronavirus</td>
                <td>coronavirus</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td>covid</td>
                <td>covid</td>
                <td>covid</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3</td>
                <td>pandem</td>
                <td>pandem</td>
                <td>pandem</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td>new</td>
                <td>new</td>
                <td>new</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>5</td>
                <td>peopl</td>
                <td>peopl</td>
                <td>help<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6</td>
                <td>say</td>
                <td>case</td>
                <td>say</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>7</td>
                <td>crisi<sup>b</sup></td>
                <td>say</td>
                <td>peopl</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>8</td>
                <td>health</td>
                <td>health</td>
                <td>test</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>9</td>
                <td>case</td>
                <td>test</td>
                <td>health</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>10</td>
                <td>death<sup>b</sup></td>
                <td>outbreak</td>
                <td>case</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>11</td>
                <td>outbreak</td>
                <td>week</td>
                <td>us</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>12</td>
                <td>virus</td>
                <td>us</td>
                <td>home</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>13</td>
                <td>test</td>
                <td>virus</td>
                <td>week</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>14</td>
                <td>could</td>
                <td>could</td>
                <td>one</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>15</td>
                <td>govern</td>
                <td>day</td>
                <td>time</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>16</td>
                <td>us</td>
                <td>one</td>
                <td>day</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>17</td>
                <td>countri</td>
                <td>govern</td>
                <td>govern</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>18</td>
                <td>one</td>
                <td>home</td>
                <td>could</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>19</td>
                <td>week</td>
                <td>countri</td>
                <td>work<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>20</td>
                <td>fear<sup>b</sup></td>
                <td>time</td>
                <td>outbreak</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Bigrams</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td>coronavirus_pandem</td>
                <td>coronavirus_pandem</td>
                <td>case_covid</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>2</td>
                <td>coronavirus_crisi</td>
                <td>case_coronavirus</td>
                <td>coronavirus_pandem</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>3</td>
                <td>coronavirus_outbreak</td>
                <td>case_covid</td>
                <td>posit_test</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>4</td>
                <td>health_public</td>
                <td>coronavirus_spread</td>
                <td>health_public</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>5</td>
                <td>posit_test</td>
                <td>distanc_social</td>
                <td>coronavirus_outbreak</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6</td>
                <td>case_coronavirus</td>
                <td>health_public</td>
                <td>case_coronavirus</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>7</td>
                <td>coronavirus_spread</td>
                <td>covid_test</td>
                <td>covid_pandem</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>8</td>
                <td>coronavirus_new</td>
                <td>coronavirus_outbreak</td>
                <td>distanc_social</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>9</td>
                <td>case_covid</td>
                <td>covid_pandem</td>
                <td>coronavirus_lockdown<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>10</td>
                <td>distanc_social</td>
                <td>coronavirus_new</td>
                <td>coronavirus_spread</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>11</td>
                <td>covid_crisi<sup>b</sup></td>
                <td>coronavirus_crisi</td>
                <td>covid_test</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>12</td>
                <td>covid_test</td>
                <td>case_new<sup>b</sup></td>
                <td>covid_vaccin<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>13</td>
                <td>covid_pandem</td>
                <td>covid_outbreak</td>
                <td>home_stay</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>14</td>
                <td>coronavirus_due<sup>b</sup></td>
                <td>posit_test</td>
                <td>coronavirus_test<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>15</td>
                <td>covid_death<sup>b</sup></td>
                <td>minist_prime</td>
                <td>covid_posit<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>16</td>
                <td>second_wave<sup>b</sup></td>
                <td>home_stay</td>
                <td>minist_prime</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>17</td>
                <td>death_toll<sup>b</sup></td>
                <td>first_time<sup>b</sup></td>
                <td>like_look<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>18</td>
                <td>coronavirus_death<sup>b</sup></td>
                <td>around_world<sup>b</sup></td>
                <td>covid_outbreak</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>19</td>
                <td>amid_coronavirus<sup>b</sup></td>
                <td>covid_spread<sup>b</sup></td>
                <td>coronavirus_new</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>20</td>
                <td>two_week</td>
                <td>two_week</td>
                <td>coronavirus_vaccin<sup>b</sup></td>
                <td>
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>For each of the 91 English-language online news sources, we calculated the most common words and bigrams and grouped these by Vader scores: &gt;0.2 for positive, &lt;–0.2 for negative, and any score for all. We averaged the ranks of words and bigrams across all online news sources, and here we present the top 20 for each subdivision. The words in the table are stemmed.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>These entries indicate elements that can be found in the top 20, only in the specific subdivisions of <italic>positive</italic>, <italic>all</italic>, or <italic>negative</italic>.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>COVID-19 subtopic coverage and sentiment means. We calculated the mean coverage and mean sentiment of each subtopic. Coverage is expressed as the mean of ratios of subtopics in a given online news source against all COVID-19 articles in the same online news source. Sentiment is the mean of the subtopic relative sentiment skew for all online news sources. The shaded areas illustrate regions with relative sentiment skew above 0.2 (green), between 0.2 and –0.2 (white), and below –0.2 (green).</p>
          </caption>
          <graphic xlink:href="jmir_v23i6e28253_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>In this work, we compiled the largest data set on COVID-19 news, collating over 26 million articles from the front pages of 172 major online news sources from 11 countries. We have made this database publicly available at SciRide [<xref ref-type="bibr" rid="ref28">28</xref>]. We first investigated trends in COVID-19–related news with respect to all front-page articles in 2020. We next used sentiment analysis to determine whether COVID-19 coverage was more polarized than other topics. Finally, we analyzed the leading subtopics in COVID-19 coverage and assessed their sentiment polarization. We demonstrated that 25% of front-page articles in traditional news media between January and October 2020 concerned COVID-19. Sentiment analysis demonstrated that pandemic coverage cannot be simply categorized as negatively polarized by virtue of disease association, pointing to heterogenous reporting. However, there was an increased incidence in reporting of negatively associated topics, in particular concerning <italic>death</italic>. Our results provide a data-driven foundation on policy communication surrounding distancing measures.</p>
      <p>NPIs are drastic measures that reduce casualties before vaccinations and/or treatment regimens become widespread. Such methods, however, are only effective with societal adherence. Information received by a population in times of a pandemic shapes collective adherence to policies introduced to stem its spread. Currently, the internet is the primary source of health information for people in developed countries [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
      <p>Comprehensive analysis of COVID-19 information received by a population would require thorough analysis of all possible internet news sources and all users’ exposure to each piece of information received. The online ecosystem is extremely heterogeneous, with channels of information discovery spread across traditional news sites, blogs, social media, and many others. Within each of such platforms, information itself can take different forms (eg, text length and format). How users interact with the information also has a great effect on the amount of attention a given piece of information receives and the degree of influence it has (eg, extent of sharing on social media or a more visible position on a website). Analysis of COVID-19 information from all online sources is not tractable.</p>
      <p>Direct access to major news sites accounts for 76% of media consumption online [<xref ref-type="bibr" rid="ref29">29</xref>]. The landing pages of such outlets implicitly capture articles that might have been seen by online users. Thus, our analysis of content from front pages of major news sites should encompass a significant proportion of sources shaping knowledge of the pandemic covering reporting across different languages and geographies. In total, we curated a data set of 26 million articles from 172 major web traffic–generating online news sources in 11 countries.</p>
      <p>We identified COVID-19–relevant articles as well as a selection of other topics to serve as reference points for both coverage volume and sentiment analysis. As a standardized common denominator among articles, we analyzed the metadata titles and descriptions, where the main subject matter can be expected to be referenced. We employed a facile topic identification method using a limited set of keyword mentions. We chose a limited number of keywords to make it unlikely that an article would not make the corresponding topic its subject matter if it were referenced in its metadata title and description (eg, politician’s name). This avoided the caveat of tangential references to certain topics mentioned in the full article body or ambiguities that might arise by using more sophisticated topic modeling algorithms [<xref ref-type="bibr" rid="ref36">36</xref>]. Unlike more complex topic modeling methods, or even using a wider set of keywords, our approach did not capture much more subtle references to these topics, and so we will have underestimated total coverage.</p>
      <p>Nonetheless, even using our simple approach, we still identified a nontrivial number of COVID-19 articles on the front pages of our online news sources. We estimate that a mean of 25% of our sample of front-page articles from 11 countries in 2020 mentioned COVID-19 in their titles and descriptions. Our method had reduced topic identification recall by not accounting for more subtle references to COVID-19, and the totality of the articles was certainly contaminated by retrieval of erroneous links that were not actual news articles. Therefore, the actual proportion of articles on the front pages of news sources referencing COVID-19 might have indeed been higher. We envision that the amount of reporting on a topic of general interest like COVID-19 needs to be balanced. Too little information might leave the population underinformed and ill-equipped to respond appropriately. Too much coverage risks obscuring information that is crucial for individuals to understand the pandemic and how to stay safe.</p>
      <p>Reporting on the pandemic could have wider implications than only its basic informative function. It is unknown what effect regular reporting on cases, casualties, and containment methods could have on adherence to distancing rules or mental health [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref40">40</xref>]. Though current sentiment analysis methods fall short of identifying complex nuance, they offer a good approximation for the position of text on the emotional spectrum (ie, negative, neutral, or positive). By employing sentiment analysis, we found that overall COVID-19 reporting was not markedly polarized in either a positive or negative direction, as opposed to cancer. It is contrary to what might be expected by virtue of the pandemic subject matter, suggesting heterogeneity in reporting. Such heterogeneity might be due to the sheer scale of the pandemic, the consequences of which have permeated much of everyday life. Nevertheless, we found that negatively polarized COVID-19 articles mentioning death, fear, and crisis accounted for 16% of pandemic articles, with death being most widely referenced. Such a nontrivial volume of negatively associated articles significantly skews the sentiment of 2020 reporting toward the negative direction.</p>
      <p>Our results offer a quantification of COVID-19 reporting that substantiates widespread qualitative observations (eg, the pandemic received an unprecedented amount of media attention). Our analysis offers insights for shaping discussion on health communication in order to maximize the effect of control policies. Our retrospective analysis of health communication during the first two waves indicates signs of information and emotional overload that might have obscured understanding of policy. We hope that our findings will inform how best to communicate so as to minimize the risk of subsequent waves while vaccination regimens are introduced.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary materials.</p>
        <media xlink:href="jmir_v23i6e28253_app1.docx" xlink:title="DOCX File , 5402 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">GDELT</term>
          <def>
            <p>Global Database of Events, Language, and Tone</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">NIHR</term>
          <def>
            <p>National Institute for Health Research</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">NPI</term>
          <def>
            <p>nonpharmaceutical intervention</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ONS</term>
          <def>
            <p>online news source</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">RSS</term>
          <def>
            <p>Really Simple Syndication</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">
            <italic>rsskew</italic>
          </term>
          <def>
            <p>relative sentiment skew</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>SB would like to acknowledge the Academy of Medical Sciences, the National Institute for Health Research (NIHR) Biomedical Research Centres, and UK Research and Innovation. DL acknowledges funding from the Vaccine Efficacy Evaluation for Priority Emerging Diseases project (grant NIHR: PR-OD-1017-20002) from the NIHR. We would also like to acknowledge Microsoft AI for Health and Amazon AWS for computing resources.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pei</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Shaman</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Substantial undocumented infection facilitates the rapid dissemination of novel coronavirus (SARS-CoV-2)</article-title>
          <source>Science</source>
          <year>2020</year>
          <month>05</month>
          <day>01</day>
          <volume>368</volume>
          <issue>6490</issue>
          <fpage>489</fpage>
          <lpage>493</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32179701"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.abb3221</pub-id>
          <pub-id pub-id-type="medline">32179701</pub-id>
          <pub-id pub-id-type="pii">science.abb3221</pub-id>
          <pub-id pub-id-type="pmcid">PMC7164387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>Coronavirus disease (COVID-19) weekly epidemiological update and weekly operational update</article-title>
          <source>World Health Organization</source>
          <year>2021</year>
          <access-date>2021-02-25</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/emergencies/diseases/novel-coronavirus-2019/situation-reports">https://www.who.int/emergencies/diseases/novel-coronavirus-2019/situation-reports</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hyafil</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moriña</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Analysis of the impact of lockdown on the reproduction number of the SARS-Cov-2 in Spain</article-title>
          <source>Gac Sanit</source>
          <year>2020</year>
          <month>05</month>
          <day>23</day>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.gacetasanitaria.org/en-analysis-impact-lockdown-on-reproduction-avance-S0213911120300984"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.gaceta.2020.05.003</pub-id>
          <pub-id pub-id-type="medline">32571528</pub-id>
          <pub-id pub-id-type="pii">S0213-9111(20)30098-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC7245209</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Khosrawipour</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Kocbach</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mikolajczyk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schubert</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bania</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khosrawipour</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The positive impact of lockdown in Wuhan on containing the COVID-19 outbreak in China</article-title>
          <source>J Travel Med</source>
          <year>2020</year>
          <month>05</month>
          <day>18</day>
          <volume>27</volume>
          <issue>3</issue>
          <fpage>taaa037</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32181488"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jtm/taaa037</pub-id>
          <pub-id pub-id-type="medline">32181488</pub-id>
          <pub-id pub-id-type="pii">5808003</pub-id>
          <pub-id pub-id-type="pmcid">PMC7184469</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gandy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Unwin</surname>
              <given-names>HJT</given-names>
            </name>
            <name name-style="western">
              <surname>Mellan</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Coupland</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Whittaker</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Berah</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Eaton</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Monod</surname>
              <given-names>M</given-names>
            </name>
            <collab>Imperial College COVID-19 Response Team</collab>
            <name name-style="western">
              <surname>Ghani</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Donnelly</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vollmer</surname>
              <given-names>MAC</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Okell</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatt</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Estimating the effects of non-pharmaceutical interventions on COVID-19 in Europe</article-title>
          <source>Nature</source>
          <year>2020</year>
          <month>08</month>
          <volume>584</volume>
          <issue>7820</issue>
          <fpage>257</fpage>
          <lpage>261</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-020-2405-7</pub-id>
          <pub-id pub-id-type="medline">32512579</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-020-2405-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dye</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dagpunar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The scale and dynamics of COVID-19 epidemics across Europe</article-title>
          <source>R Soc Open Sci</source>
          <year>2020</year>
          <month>11</month>
          <volume>7</volume>
          <issue>11</issue>
          <fpage>201726</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://royalsocietypublishing.org/doi/10.1098/rsos.201726?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1098/rsos.201726</pub-id>
          <pub-id pub-id-type="medline">33391818</pub-id>
          <pub-id pub-id-type="pii">rsos201726</pub-id>
          <pub-id pub-id-type="pmcid">PMC7735356</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salje</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tran Kiem</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lefrancq</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Courtejoie</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bosetti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Paireau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Andronico</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hozé</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Richet</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dubost</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Le Strat</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lessler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Levy-Bruhl</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fontanet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Opatowski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Boelle</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cauchemez</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Estimating the burden of SARS-CoV-2 in France</article-title>
          <source>Science</source>
          <year>2020</year>
          <month>07</month>
          <day>10</day>
          <volume>369</volume>
          <issue>6500</issue>
          <fpage>208</fpage>
          <lpage>211</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32404476"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.abc3517</pub-id>
          <pub-id pub-id-type="medline">32404476</pub-id>
          <pub-id pub-id-type="pii">science.abc3517</pub-id>
          <pub-id pub-id-type="pmcid">PMC7223792</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brauner</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Mindermann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Johnston</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Salvatier</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gavenčiak</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Stephenson</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Leech</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mikulik</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Norman</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Monrad</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Besiroglu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hartwick</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Teh</surname>
              <given-names>YW</given-names>
            </name>
            <name name-style="western">
              <surname>Chindelevitch</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gal</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kulveit</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Inferring the effectiveness of government interventions against COVID-19</article-title>
          <source>Science</source>
          <year>2021</year>
          <month>02</month>
          <day>19</day>
          <volume>371</volume>
          <issue>6531</issue>
          <fpage>eabd9338</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33323424"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.abd9338</pub-id>
          <pub-id pub-id-type="medline">33323424</pub-id>
          <pub-id pub-id-type="pii">science.abd9338</pub-id>
          <pub-id pub-id-type="pmcid">PMC7877495</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Okell</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Verity</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Watson</surname>
              <given-names>OJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Whittaker</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Katzourakis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Donnelly</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ghani</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Gandy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatt</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Have deaths from COVID-19 in Europe plateaued due to herd immunity?</article-title>
          <source>Lancet</source>
          <year>2020</year>
          <month>06</month>
          <day>20</day>
          <volume>395</volume>
          <issue>10241</issue>
          <fpage>e110</fpage>
          <lpage>e111</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32534627"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)31357-X</pub-id>
          <pub-id pub-id-type="medline">32534627</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)31357-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7289569</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sibley</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Greaves</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Satherley</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Overall</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CHJ</given-names>
            </name>
            <name name-style="western">
              <surname>Milojev</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bulbulia</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Osborne</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Milfont</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Houkamau</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Duck</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Vickers-Jones</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Barlow</surname>
              <given-names>FK</given-names>
            </name>
          </person-group>
          <article-title>Effects of the COVID-19 pandemic and nationwide lockdown on trust, attitudes toward government, and well-being</article-title>
          <source>Am Psychol</source>
          <year>2020</year>
          <volume>75</volume>
          <issue>5</issue>
          <fpage>618</fpage>
          <lpage>630</lpage>
          <pub-id pub-id-type="doi">10.1037/amp0000662</pub-id>
          <pub-id pub-id-type="medline">32496074</pub-id>
          <pub-id pub-id-type="pii">2020-39514-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Akinwunmi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>CJP</given-names>
            </name>
            <name name-style="western">
              <surname>Ming</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Health communication through news media during the early stage of the COVID-19 outbreak in China: Digital topic modeling approach</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>04</month>
          <day>28</day>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>e19118</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/4/e19118/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19118</pub-id>
          <pub-id pub-id-type="medline">32302966</pub-id>
          <pub-id pub-id-type="pii">v22i4e19118</pub-id>
          <pub-id pub-id-type="pmcid">PMC7189789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Information resource orchestration during the COVID-19 pandemic: A study of community lockdowns in China</article-title>
          <source>Int J Inf Manage</source>
          <year>2020</year>
          <month>10</month>
          <volume>54</volume>
          <fpage>102143</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32394997"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijinfomgt.2020.102143</pub-id>
          <pub-id pub-id-type="medline">32394997</pub-id>
          <pub-id pub-id-type="pii">S0268-4012(20)30631-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7211621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Freifeld</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Madoff</surname>
              <given-names>LC</given-names>
            </name>
          </person-group>
          <article-title>Digital disease detection — Harnessing the web for public health surveillance</article-title>
          <source>N Engl J Med</source>
          <year>2009</year>
          <month>05</month>
          <day>21</day>
          <volume>360</volume>
          <issue>21</issue>
          <fpage>2153</fpage>
          <lpage>2157</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmp0900702</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freifeld</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mandl</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Reis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>HealthMap: Global infectious disease monitoring through automated classification and visualization of internet media reports</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2008</year>
          <volume>15</volume>
          <issue>2</issue>
          <fpage>150</fpage>
          <lpage>157</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18096908"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M2544</pub-id>
          <pub-id pub-id-type="medline">18096908</pub-id>
          <pub-id pub-id-type="pii">M2544</pub-id>
          <pub-id pub-id-type="pmcid">PMC2274789</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamzah</surname>
              <given-names>FAB</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Nazri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ligot</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Shaib</surname>
              <given-names>MKBM</given-names>
            </name>
            <name name-style="western">
              <surname>Zaidon</surname>
              <given-names>UHB</given-names>
            </name>
            <name name-style="western">
              <surname>Abdullah</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Ongk</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Chewl</surname>
              <given-names>PY</given-names>
            </name>
            <name name-style="western">
              <surname>Salungam</surname>
              <given-names>RE</given-names>
            </name>
          </person-group>
          <article-title>CoronaTracker: World-wide COVID-19 outbreak data analysis and prediction</article-title>
          <source>Bull World Health Organ</source>
          <year>2020</year>
          <month>03</month>
          <day>19</day>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/bulletin/online_first/20-255695.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.2471/blt.20.255695</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Evanega</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lynas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Smolenyak</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Coronavirus misinformation: Quantifying sources and themes in the COVID-19 ‘infodemic’</article-title>
          <source>JMIR Preprints.</source>
          <comment>Preprint posted online on October 19, 2020.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://preprints.jmir.org/preprint/25143"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/preprints.25143</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madraki</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Grasso</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Otala</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Characterizing and comparing COVID-19 misinformation across languages, countries and platforms</article-title>
          <source>arXiv.</source>
          <comment>Preprint posted online on October 13, 2020.
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/2010.06455"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Okan</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Bollweg</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Berens</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hurrelmann</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Schaeffer</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Coronavirus-related health literacy: A cross-sectional study in adults during the COVID-19 infodemic in Germany</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>07</month>
          <day>30</day>
          <volume>17</volume>
          <issue>15</issue>
          <fpage>5503</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17155503"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17155503</pub-id>
          <pub-id pub-id-type="medline">32751484</pub-id>
          <pub-id pub-id-type="pii">ijerph17155503</pub-id>
          <pub-id pub-id-type="pmcid">PMC7432052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tavares Lima</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Moreira de Medeiros Carvalho</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>de Araújo Araruna Silva Lima</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>de Oliveira Nunes</surname>
              <given-names>JVA</given-names>
            </name>
            <name name-style="western">
              <surname>Saraiva</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>de Souza</surname>
              <given-names>RI</given-names>
            </name>
            <name name-style="western">
              <surname>Lima da Silva</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Rolim Neto</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <article-title>The emotional impact of coronavirus 2019-nCoV (new coronavirus disease)</article-title>
          <source>Psychiatry Res</source>
          <year>2020</year>
          <month>05</month>
          <volume>287</volume>
          <fpage>112915</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32199182"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.psychres.2020.112915</pub-id>
          <pub-id pub-id-type="medline">32199182</pub-id>
          <pub-id pub-id-type="pii">S0165-1781(20)30516-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7195292</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shabahang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aruguete</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McCutcheon</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Online health information utilization and online news exposure as predictor of COVID-19 anxiety</article-title>
          <source>N Am J Psychol</source>
          <year>2020</year>
          <month>09</month>
          <day>28</day>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>469</fpage>
          <lpage>482</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/profile/Mara-Aruguete-2/publication/344408789_Online_Health_Information_Utilization_and_Online_News_Exposure_as_Predictor_of_COVID19_Anxiety/links/5f72444ca6fdcc008644cc28/Online-Health-Information-Utilization-and-Online-News-Exposure-as-Predictor-of-COVID19-Anxiety.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamidein</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hatami</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rezapour</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>How people emotionally respond to the news on COVID-19: An online survey</article-title>
          <source>Basic Clin Neurosci</source>
          <year>2020</year>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>171</fpage>
          <lpage>178</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32855776"/>
          </comment>
          <pub-id pub-id-type="doi">10.32598/bcn.11.covid19.809.2</pub-id>
          <pub-id pub-id-type="medline">32855776</pub-id>
          <pub-id pub-id-type="pii">BCN-11-171</pub-id>
          <pub-id pub-id-type="pmcid">PMC7368107</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lauren</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hon</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Birmingham</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hon</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lipsky</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Social network analysis of COVID-19 sentiments: Application of artificial intelligence</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>08</month>
          <day>18</day>
          <volume>22</volume>
          <issue>8</issue>
          <fpage>e22590</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/8/e22590/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22590</pub-id>
          <pub-id pub-id-type="medline">32750001</pub-id>
          <pub-id pub-id-type="pii">v22i8e22590</pub-id>
          <pub-id pub-id-type="pmcid">PMC7438102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Detecting topic and sentiment dynamics due to COVID-19 pandemic using social media</article-title>
          <source>Proceedings of the International Conference on Advanced Data Mining and Applications</source>
          <year>2020</year>
          <conf-name>International Conference on Advanced Data Mining and Applications</conf-name>
          <conf-date>November 12-15, 2020</conf-date>
          <conf-loc>Foshan, China</conf-loc>
          <fpage>610</fpage>
          <lpage>623</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/2007.02304"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/978-3-030-65390-3_46</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>SU</given-names>
            </name>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 pandemic: A sentiment analysis</article-title>
          <source>Eur Heart J</source>
          <year>2020</year>
          <month>10</month>
          <day>14</day>
          <volume>41</volume>
          <issue>39</issue>
          <fpage>3782</fpage>
          <lpage>3783</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32678890"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/eurheartj/ehaa597</pub-id>
          <pub-id pub-id-type="medline">32678890</pub-id>
          <pub-id pub-id-type="pii">5873149</pub-id>
          <pub-id pub-id-type="pmcid">PMC7454503</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aslam</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Awan</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Syed</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Kashif</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Parveen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Sentiments and emotions evoked by news headlines of coronavirus disease (COVID-19) outbreak</article-title>
          <source>Humanit Soc Sci Commun</source>
          <year>2020</year>
          <month>07</month>
          <day>08</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/s41599-020-0523-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1057/s41599-020-0523-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Letter to the editor: Headline stress disorder caused by Netnews during the outbreak of COVID-19</article-title>
          <source>Health Expect</source>
          <year>2020</year>
          <month>04</month>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>259</fpage>
          <lpage>260</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32227627"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/hex.13055</pub-id>
          <pub-id pub-id-type="medline">32227627</pub-id>
          <pub-id pub-id-type="pmcid">PMC7104635</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bose</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Around the world in 60 days: An exploratory study of impact of COVID-19 on online global news sentiment</article-title>
          <source>J Comput Soc Sci</source>
          <year>2020</year>
          <month>10</month>
          <day>21</day>
          <fpage>1</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33102926"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s42001-020-00088-3</pub-id>
          <pub-id pub-id-type="medline">33102926</pub-id>
          <pub-id pub-id-type="pii">88</pub-id>
          <pub-id pub-id-type="pmcid">PMC7576103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Volanakis</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>SciRide</source>
          <access-date>2021-05-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://sciride.org">http://sciride.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flaxman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Filter bubbles, echo chambers, and online news consumption</article-title>
          <source>Public Opin Q</source>
          <year>2016</year>
          <month>03</month>
          <day>22</day>
          <volume>80</volume>
          <issue>S1</issue>
          <fpage>298</fpage>
          <lpage>320</lpage>
          <pub-id pub-id-type="doi">10.1093/poq/nfw006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <source>Internet Archive</source>
          <access-date>2021-05-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://web.archive.org/">http://web.archive.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Volanakis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>SciRide Finder: A citation-based paradigm in biomedical literature search</article-title>
          <source>Sci Rep</source>
          <year>2018</year>
          <month>04</month>
          <day>18</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>6193</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-018-24571-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-018-24571-0</pub-id>
          <pub-id pub-id-type="medline">29670147</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-018-24571-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5906646</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Trampuš</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Novak</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Internals of an aggregated web news feed</article-title>
          <source>Proceedings of the 15th International Multiconference Information Society</source>
          <year>2012</year>
          <conf-name>15th International Multiconference Information Society</conf-name>
          <conf-date>October 8-12, 2012</conf-date>
          <conf-loc>Ljubljana, Slovenia</conf-loc>
          <fpage>221</fpage>
          <lpage>224</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://library.ijs.si/Stacks/Proceedings/InformationSociety/2012/IS2012_Volume_A.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hutto</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Vader: A parsimonious rule-based model for sentiment analysis of social media text</article-title>
          <source>Proceedings of the 8th International AAAI Conference on Weblogs and Social Media</source>
          <year>2014</year>
          <conf-name>8th International AAAI Conference on Weblogs and Social Media</conf-name>
          <conf-date>June 1-4, 2014</conf-date>
          <conf-loc>Ann Arbor, MI</conf-loc>
          <fpage>216</fpage>
          <lpage>225</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aaai.org/ocs/index.php/ICWSM/ICWSM14/paper/view/8109/8122"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Sentiment analysis of financial news</article-title>
          <source>Proceedings of the 12th International Conference on Computational Intelligence and Communication Networks</source>
          <year>2020</year>
          <conf-name>12th International Conference on Computational Intelligence and Communication Networks</conf-name>
          <conf-date>September 25-26, 2020</conf-date>
          <conf-loc>Bhimtal, India</conf-loc>
          <fpage>312</fpage>
          <lpage>315</lpage>
          <pub-id pub-id-type="doi">10.1109/cicn49253.2020.9242579</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lemire</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Paré</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sicotte</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Determinants of internet use as a preferred source of information on personal health</article-title>
          <source>Int J Med Inform</source>
          <year>2008</year>
          <month>11</month>
          <volume>77</volume>
          <issue>11</issue>
          <fpage>723</fpage>
          <lpage>734</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2008.03.002</pub-id>
          <pub-id pub-id-type="medline">18434246</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(08)00039-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gledson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Keane</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Measuring topic homogeneity and its application to dictionary-based word sense disambiguation</article-title>
          <source>Proceedings of the 22nd International Conference on Computational Linguistics</source>
          <year>2008</year>
          <conf-name>22nd International Conference on Computational Linguistics</conf-name>
          <conf-date>August 18-22, 2008</conf-date>
          <conf-loc>Manchester, UK</conf-loc>
          <fpage>273</fpage>
          <lpage>280</lpage>
          <pub-id pub-id-type="doi">10.3115/1599081.1599116</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jobes</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Berman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Carroll</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Eastgard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Knickmeyer</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The Kurt Cobain suicide crisis: Perspectives from research, public health, and the news media</article-title>
          <source>Suicide Life Threat Behav</source>
          <year>1996</year>
          <volume>26</volume>
          <issue>3</issue>
          <fpage>260</fpage>
          <lpage>269; discussion 269-271</lpage>
          <pub-id pub-id-type="medline">8897665</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Basil</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Media celebrities and public health: Responses to 'Magic' Johnson's HIV disclosure and its impact on AIDS risk and high-risk behaviors</article-title>
          <source>Health Commun</source>
          <year>1995</year>
          <month>10</month>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>345</fpage>
          <lpage>370</lpage>
          <pub-id pub-id-type="doi">10.1207/s15327027hc0704_4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Wharf-Higgins</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Naylor</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>SARS wars: An examination of the quantity and construction of health information in the news media</article-title>
          <source>Health Commun</source>
          <year>2007</year>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>35</fpage>
          <lpage>44</lpage>
          <pub-id pub-id-type="doi">10.1080/10410230701283322</pub-id>
          <pub-id pub-id-type="medline">17461750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weitz</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Eksin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dushoff</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Awareness-driven behavior changes can shift the shape of epidemics away from peaks and toward plateaus, shoulders, and oscillations</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2020</year>
          <month>12</month>
          <day>22</day>
          <volume>117</volume>
          <issue>51</issue>
          <fpage>32764</fpage>
          <lpage>32771</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33262277"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.2009911117</pub-id>
          <pub-id pub-id-type="medline">33262277</pub-id>
          <pub-id pub-id-type="pii">2009911117</pub-id>
          <pub-id pub-id-type="pmcid">PMC7768772</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
