<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v25i1e37237</article-id>
      <article-id pub-id-type="pmid">36596215</article-id>
      <article-id pub-id-type="doi">10.2196/37237</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Users’ Reactions to Announced Vaccines Against COVID-19 Before Marketing in France: Analysis of Twitter Posts</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Basch</surname>
            <given-names>Corey</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Luo</surname>
            <given-names>Xiao</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wawrzuta</surname>
            <given-names>Dominik</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Elbattah</surname>
            <given-names>Mahmoud</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Dupuy-Zini</surname>
            <given-names>Alexandre</given-names>
          </name>
          <degrees>MEng</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4548-753X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Audeh</surname>
            <given-names>Bissan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8550-8724</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Gérardin</surname>
            <given-names>Christel</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9303-6349</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Duclos</surname>
            <given-names>Catherine</given-names>
          </name>
          <degrees>PharmD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8745-378X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Gagneux-Brunon</surname>
            <given-names>Amandine</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0892-2187</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Bousquet</surname>
            <given-names>Cedric</given-names>
          </name>
          <degrees>PharmD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <address>
            <institution>Service de santé publique et information médicale</institution>
            <institution>Centre Hospitalier Universitaire de Saint Etienne</institution>
            <addr-line>Bâtiment CIM42, Hôpital Nord</addr-line>
            <addr-line>Saint Etienne, 42055</addr-line>
            <country>France</country>
            <phone>33 4 77 12 79 74</phone>
            <email>cedric.bousquet@chu-st-etienne.fr</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9775-2476</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Laboratoire d'Informatique Médicale et d'Ingénierie des connaissances en e-Santé, LIMICS</institution>
        <institution>Sorbonne Université, Université Sorbonne Paris Nord, Institut national de la santé et de la recherche médicale, INSERM</institution>
        <addr-line>Paris</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Institut Pierre Louis d'Epidémiologie et de Santé Publique</institution>
        <institution>Département de médecine interne</institution>
        <institution>Sorbonne Université</institution>
        <addr-line>Paris</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Groupe sur l'Immunité des Muqueuses et Agents Pathogènes</institution>
        <institution>Centre International de Recherche en Infectiologie</institution>
        <institution>University of Lyon</institution>
        <addr-line>Saint Etienne</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Vaccinologie</institution>
        <institution>Centre Hospitalier Universitaire de Saint-Etienne</institution>
        <addr-line>Saint Etienne</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Service de santé publique et information médicale</institution>
        <institution>Centre Hospitalier Universitaire de Saint Etienne</institution>
        <addr-line>Saint Etienne</addr-line>
        <country>France</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Cedric Bousquet <email>cedric.bousquet@chu-st-etienne.fr</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>24</day>
        <month>4</month>
        <year>2023</year>
      </pub-date>
      <volume>25</volume>
      <elocation-id>e37237</elocation-id>
      <history>
        <date date-type="received">
          <day>11</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>19</day>
          <month>3</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>17</day>
          <month>7</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>9</day>
          <month>8</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Alexandre Dupuy-Zini, Bissan Audeh, Christel Gérardin, Catherine Duclos, Amandine Gagneux-Brunon, Cedric Bousquet. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 24.04.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2023/1/e37237" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Within a few months, the COVID-19 pandemic had spread to many countries and had been a real challenge for health systems all around the world. This unprecedented crisis has led to a surge of online discussions about potential cures for the disease. Among them, vaccines have been at the heart of the debates and have faced lack of confidence before marketing in France.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to identify and investigate the opinions of French Twitter users on the announced vaccines against COVID-19 through sentiment analysis.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This study was conducted in 2 phases. First, we filtered a collection of tweets related to COVID-19 available on Twitter from February 2020 to August 2020 with a set of keywords associated with vaccine mistrust using word embeddings. Second, we performed sentiment analysis using deep learning to identify the characteristics of vaccine mistrust. The model was trained on a hand-labeled subset of 4548 tweets.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A set of 69 relevant keywords were identified as the semantic concept of the word “vaccin” (vaccine in French) and focused mainly on conspiracies, pharmaceutical companies, and alternative treatments. Those keywords enabled us to extract nearly 350,000 tweets in French. The sentiment analysis model achieved 0.75 accuracy. The model then predicted 16% of positive tweets, 41% of negative tweets, and 43% of neutral tweets. This allowed us to explore the semantic concepts of positive and negative tweets and to plot the trends of each sentiment. The main negative rhetoric identified from users’ tweets was that vaccines are perceived as having a political purpose and that COVID-19 is a commercial argument for the pharmaceutical companies.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Twitter might be a useful tool to investigate the arguments for vaccine mistrust because it unveils political criticism contrasting with the usual concerns on adverse drug reactions. As the opposition rhetoric is more consistent and more widely spread than the positive rhetoric, we believe that this research provides effective tools to help health authorities better characterize the risk of vaccine mistrust.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>COVID-19 Vaccines</kwd>
        <kwd>Social Media</kwd>
        <kwd>Deep Learning</kwd>
        <kwd>France</kwd>
        <kwd>Sentiment Analysis</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>COVID-19 and Vaccine Hesitancy</title>
        <p>Since December 2019, the COVID-19 outbreak has led governments to impose a wide range of policies to help contain the effect of the pandemic. In France, after a 55-day total lockdown from March 2020 to May 2020, restrictions were partially lifted during the summer, but they were reinstated as soon as October 2020. COVID-19 vaccines were developed since the first wave of the pandemic. Early, before their development, COVID-19 vaccines had to face the challenge of acceptance, as France is one the most “vaccine-hesitant” countries in general.</p>
        <p>Parallel to the spread of the COVID-19 pandemic, an infodemic was observed. An infodemic is an excess of information including false or misleading information in digital and physical environments during a disease outbreak. Social media may contribute to an infodemic and to the spread of misinformation about vaccines and contribute to decision-making about vaccines. Thus, social media listening may constitute a means to predict attitudes toward a vaccine. Our hypothesis was that analyzing conversations on social media such as Twitter during the first wave of the COVID-19 pandemic could have supported the prediction of attitudes of the French population.</p>
        <p>According to the World Health Organization (WHO), “vaccine hesitancy refers to delay in acceptance or refusal of vaccines despite availability of vaccination services” [<xref ref-type="bibr" rid="ref1">1</xref>]. When vaccines are not available on the market, hesitancy can be substituted by mistrust. For example, “vaccine hesitancy” is relevant for the human papillomavirus (HPV) vaccine when concerns about this vaccine are reported in the literature after it is available on the market.</p>
        <p>Questioning the relevance of vaccines has been a well-established trend in France since the end of the 19th century when the hesitancy turned political. Vaccine hesitancy today still focuses on the opposition to compulsory vaccination, opposition to government intrusion into the practice of medicine, and defense of individual liberties [<xref ref-type="bibr" rid="ref2">2</xref>]. Arguments against vaccines are supported by different actors, and public sensitivity to these ideas has become a major political issue at both national and international levels. In France, a climate of skepticism about vaccines has been fueled by events such as the suspension of the hepatitis B vaccination on suspicion of side effects and the issue of the H1N1 vaccination campaign in which large expenditures were made but the epidemic turned out to be much less intense than expected. Another example that received major attention in the media worldwide is the association between vaccination and autism [<xref ref-type="bibr" rid="ref3">3</xref>] supported by data that were subsequently retracted [<xref ref-type="bibr" rid="ref4">4</xref>]. Before the vaccine rollout, 26% of the French population would refuse to be vaccinated if a vaccine against COVID-19 became available [<xref ref-type="bibr" rid="ref5">5</xref>]. Previous attitudes of vaccine hesitancy were associated with negative opinions toward COVID-19 vaccines [<xref ref-type="bibr" rid="ref6">6</xref>]. Another study conducted by IPSOS from October 8, 2020, to October 13, 2020 [<xref ref-type="bibr" rid="ref7">7</xref>], revealed that, in France, 54% of respondents would get it if the vaccine was available. It was one of the worst scores among 15 countries with an average of 73%. IPSOS [<xref ref-type="bibr" rid="ref7">7</xref>] conducted this study again at the end of 2020, from December 17 to December 20, and showed that the proportion selecting “Totally Agree” fell to 40%. Among 15 countries, France was the most refractory to the vaccine against COVID-19. This was confirmed by a study by Lazarus et al [<xref ref-type="bibr" rid="ref8">8</xref>] that showed only 59% had positive opinions about the vaccine in June 2020.</p>
        <p>In this paper, we explored the content on Twitter with the help of advanced machine learning techniques to identify the barriers and motivations concerning the announced vaccines against COVID-19 in France between January 2020 and August 2020. Our work aimed to assess the characteristics of users’ opinions to identify positive and negative reactions about COVID-19 vaccines and reveal main elements related to vaccine mistrust in the COVID-19 context.</p>
        <p>In this paper, we managed to identify a set of tweets to meet the objective. The added value was as follows: (1) A selection of relevant keywords for the field of anti-COVID vaccines is proposed, which combines the computation of embeddings with FastText and their representation by means of a principal component analysis, and (2) topics are identified in the tweets that could help explain mistrust of vaccines and counter them with negative argument.</p>
      </sec>
      <sec>
        <title>Using Social Media to Monitor Vaccine Resistance</title>
        <p>The period of the COVID-19 crisis favored the publication of numerous surveys of European citizens to assess intentions to vaccinate against COVID-19 and to identify the categories of individuals most susceptible to vaccine resistance [<xref ref-type="bibr" rid="ref9">9</xref>]. These studies were based on controlled statistical methods in which respondents are constrained by a limited number of answers predefined by the investigators [<xref ref-type="bibr" rid="ref10">10</xref>]. As a result, reasons for vaccine hesitancy other than those proposed in the controlled studies cannot be detected. However, the public is exposed to new events on a daily basis, and additional reasons for vaccine mistrust may emerge rapidly and not be captured by static resources.</p>
        <p>Real-time monitoring of social media can be an indicator of society’s hottest emerging issues. As the exhaustive analysis of a large volume of messages is impossible, the use of recent advances in natural language processing (NLP) has become the actual trend. Sentiment and opinion analysis regarding the COVID-19 pandemic benefited from recent automatic approaches to social media analysis. For example, topic modeling was used on Twitter by Wang et al [<xref ref-type="bibr" rid="ref11">11</xref>] to analyze public opinion toward COVID-19 in California and New York and by Luo et al [<xref ref-type="bibr" rid="ref12">12</xref>] who performed a similar analysis on HPV vaccination. Sha et al [<xref ref-type="bibr" rid="ref13">13</xref>] used dynamic topic modeling to track governmental decision-making regarding risk, testing, and treatment based on tweets by US governors and presidential cabinet members. Several infodemiology studies applied machine learning approaches to analyze social media. Daughton et al [<xref ref-type="bibr" rid="ref14">14</xref>] used supervised learning classifiers to identify human behaviors relevant to COVID-19. Similarly, Chen et al [<xref ref-type="bibr" rid="ref15">15</xref>] used dimension reduction and cluster analysis to support comparison between viral COVID-19 posts on Twitter and Sina Weibo, a non-English–speaking platform in China. In some cases, multiple artificial intelligence approaches can be used to construct an observation framework, such as in the study by Adikari et al [<xref ref-type="bibr" rid="ref16">16</xref>] in which a combination of several machine learning approaches, including NLP, word embeddings, and Markov models, was proposed to investigate COVID-19–related emotions.</p>
        <p>Exploring vaccine hesitancy through online posts on social media is inspiring. Although some studies focused on qualitative analysis of a limited number of posts [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], others employed semiautomatic approaches such as in the study by Massey et al [<xref ref-type="bibr" rid="ref19">19</xref>], which used content and network analysis to study misinformation about the HPV vaccine. Recently, the use of automatic approaches based on NLP has become frequent for quantitative studies about vaccine hesitancy. For example, for sentiment analysis about the HPV vaccine, Skeppstedt et al [<xref ref-type="bibr" rid="ref20">20</xref>] used topic modeling on discussion forums, and Zhang et al [<xref ref-type="bibr" rid="ref21">21</xref>] used transfer learning on Twitter posts. Similar approaches were applied to analyze vaccine hesitancy in the COVID-19 context. Hussain et al [<xref ref-type="bibr" rid="ref22">22</xref>] used deep learning and NLP to analyze public sentiment toward COVID-19 vaccines based on a set of Twitter and Facebook posts from the United Kingdom and the United States. Kwok et al [<xref ref-type="bibr" rid="ref23">23</xref>] used topic models based on latent Dirichlet allocation [<xref ref-type="bibr" rid="ref24">24</xref>] for sentiment analysis about the COVID-19 vaccine among Australian Twitter users. Such studies are specific to the cultural and political context that affected decision-making in vaccination policy.</p>
      </sec>
      <sec>
        <title>Using Pretrained NLP Models to Support Social Media Monitoring</title>
        <p>To our knowledge, most social media studies regarding COVID-19 vaccine hesitancy in France are qualitative and do not benefit from advanced and efficient machine learning.</p>
        <p>There are now many pretrained NLP models available, depending on the languages or texts used during training. Models in English were created to facilitate research, such as COVID-Twitter-BERT [<xref ref-type="bibr" rid="ref25">25</xref>], which is trained on English tweets mentioning the COVID-19 pandemic. Arnaud et al [<xref ref-type="bibr" rid="ref26">26</xref>] described previous work on the French adaptation of Bidirectional Encoder Representations from Transformers (BERT): CamemBERT and FlauBERT. The objective was to perform unsupervised learning, while we focused on supervised learning. Blanc et al [<xref ref-type="bibr" rid="ref27">27</xref>] compared the performances of CamemBERT and FlauBERT to build a chatbot, and Sauvayre et al [<xref ref-type="bibr" rid="ref28">28</xref>] used CamemBERT to classify the opinion of Twitter users on COVID-19 vaccines. The BERT language model is therefore usable for the French language and could be adapted for the classification of tweets.</p>
      </sec>
      <sec>
        <title>Mistrust About COVID-19 Vaccines and the Opportunity With Social Media Listening</title>
        <p>Mistrust about COVID-19 vaccines has spread widely across social media. Consequently, its influence was able to reach a large part of the population. This mistrust situation was causing concern for health authorities, including the WHO, which listed vaccine mistrust as one of the 10 biggest threats for global health in 2019 next to the threat of a pandemic [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <p>According to Taylor et al [<xref ref-type="bibr" rid="ref30">30</xref>], there are many reasons for this mistrust: One may be doubtful of the vaccine benefit; there may be concerns about long-term, unexpected side effects; marketing of vaccines may be considered as a mere commercial operation in which vendors are profiteering from patients; and one may prefer natural immunity rather than getting immunity from the vaccine. Other studies have considered conspiracy theories as an element influencing the decision to get vaccinated [<xref ref-type="bibr" rid="ref31">31</xref>]. Examples of these theories in the context of COVID-19 are Bill Gates’ intention to create a “global surveillance state” [<xref ref-type="bibr" rid="ref32">32</xref>] and the economic motivation of the “Big Pharma” vaccine industry [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
        <p>Analyzing social media can facilitate the evaluation of adherence to a potential COVID-19 vaccine. As we mentioned in the Introduction section, part of the population has doubts about the nonauthorization of chloroquine for the treatment of COVID-19. These doubts could have been supported by the highly mediatized “Lancet Gate” in which the WHO urgently stopped trials on chloroquine and hydroxychloroquine as a treatment against COVID-19 based on scientific papers that used corrupted data and were retracted shortly later [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        <p>The high accessibility to social media today highlights that popular news on this resource can reach an important number of people in a short time [<xref ref-type="bibr" rid="ref36">36</xref>]. The general director of the WHO declared in 2020 that the WHO must deal with the infodemic in addition to the pandemic [<xref ref-type="bibr" rid="ref37">37</xref>]. A new report published by the Centre for Countering Digital Hate noted that 31 million people follow antivaccine groups on Facebook, with 17 million people subscribing to similar accounts on YouTube [<xref ref-type="bibr" rid="ref38">38</xref>]. Such accessibility to a large volume of information can help identify public views. However, this resource cannot replace more controlled survey methods because of the inherent selection bias on one hand and the uncontrolled spread of false information via this resource on the other hand [<xref ref-type="bibr" rid="ref39">39</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>This study was conducted in 2 steps that were designed to be accessible and easily adapted to any other subject at a specific time. The first step consisted of constructing a data set of French tweets related to COVID-19. From this data set, a subset of keywords relative to the word “vaccin” (vaccine in French) was selected by exploring embeddings with a distance close to this word. By restricting the data set to the tweets containing at least one of these keywords, a data set related to the topic of vaccine in French during the COVID-19 pandemic was reached. The second step focused on sentiment analysis. As this part required machine learning, a small part of the restricted data set needed to be hand labeled to fine tune a pretrained model. After training and evaluating the model, label prediction was performed on the whole restricted data set, and the predictions were explored in terms of vocabulary and timeline. These steps are summarized in <xref rid="figure1" ref-type="fig">Figure 1</xref> and explained in detail in the subsections hereafter.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Summary of the study methodology, with the different phases separated by horizontal lines.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Collection</title>
        <p>Data were collected before vaccines were available on the market. About 700 million unique tweets were identified by the Panacea Lab team at Georgia State University [<xref ref-type="bibr" rid="ref40">40</xref>] for the period between February 2020 and August 2020 using a selection of keywords that were mainly COVID-19 designation variants, and the corresponding IDs were made available on GitHub. A new version is made available every week and collects approximately 3 million tweets per day. Once restricted to tweets in French, the database has yet to be restricted to the vaccination topic. We did not use Twitter's localization function to verify that the tweets were written in France because the information was often missing.</p>
        <p>The data from the Panacea Lab have the advantage of having been collected constantly since the start of the pandemic using inclusion criteria that can be reproduced over time. Panacea Lab provided a public set of tweet IDs of COVID-19–related tweets. The Twitter application programming interface (API) was needed to get twitter contents based on these IDs. The advantage of using a public, prefiltered data set is the possibility to eventually compare the results to other studies using the same data set.</p>
      </sec>
      <sec>
        <title>Data Refinement Based on Word Embeddings</title>
        <p>Word embeddings are a way of representing a word in the vocabulary in a mathematical space. Words are transformed into vectors of a fixed number of dimensions to embed information about their meaning in the corpus. Thus, words that are close in meaning will be close in distance in this space. The choice of the word embeddings model is based on the properties and specificities of the data, as they influence the performance of the algorithms using them.</p>
        <p>For this purpose, a word embeddings model was trained on the whole French tweet data set to catch emerging words that would not exist in a training data set of pretrained algorithms or pretrained word embedding algorithms.</p>
      </sec>
      <sec>
        <title>Data Set Generation Using a Fine-Tuned FastText Model</title>
        <p>Since the data are composed of short, noisy messages with uncertain spelling, the word embeddings generated by FastText offer significant advantages. Notably, this method is considered to be fast, enables words with a similar spelling to be brought together by using parameter sharing, and can provide better performance when the vocabulary contains many syntactic or orthographic variations of the same word. Most word embedding models learn a vectorial representation from the word’s context, but as FastText also learns additional embeddings at the character level of the word, the decomposition of an unknown word enables it to learn more relevant embeddings for rare words. The aforementioned technique, which is named parameter sharing, is an advantage since most models do not address the diversity of morphologically rich languages such as French. Accurate word representations are difficult to learn since many word forms occur too rarely in the training corpus. Parameter sharing also enables the handling of uncertain spelling observed in tweets.</p>
        <p>As word embedding models come with hyperparameters, tuning FastText is necessary to fit the corpus at best. The metric used for that task is a criterion named the Discounted Cumulative Gain (DCG), which considers a user-defined collection of word pairs that are known to be close in meaning or context and computes the score of the cumulative closeness of the embeddings associated with the pairs. One example was the pair of French words “covid” and “coronavirus.” The list of 24 word pairs in French we used and their translation in English are available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The higher the DCG, the more the model is expected to fit the corpus.</p>
        <p>To complete the restriction of the French tweets to a vaccine-centered data set, a semantic field of the French word “vaccin” was built: By iterating from the word “vaccin,” words close in the embedding space were added to the semantic field by computing their distance. This set of keywords is therefore composed of the closest words in distance to the word “vaccin” in the embedded space, truncated with a user-defined threshold. First, we selected a couple of words close to “vaccin.” Then, we used the group of words composed of “vaccine” and its close neighbors to find words that are close to this group. Finally, we iterated by making the group grow by integrating more neighbors until there were no neighbors considering the user-defined threshold. The final restricted data set was then composed of tweets containing at least one of those keywords. These keywords were also used to explore the topics surrounding the vaccination topic using principal component analysis (PCA).</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>Data preprocessing was designed to be as minimal as possible and focused on 2 main tasks. The first was to delete unnecessary information, and the second was to lower the noise in texts.</p>
        <p>First, the following steps were applied to the restricted data set: URLs, punctuation, and special characters were removed. Tweets were then split into lists of lowercased words, and words that did not add any real value to the meaning (stop words) were also removed.</p>
        <p>In addition, some words such as “hydroxychloroquine” have many spelling variations. In order to suppress part of the noise to obtain better performance, a spelling correction step was applied. It consisted of comparing each word to a custom French dictionary and then correcting the 3000 most common mistakes; it could correct approximately 70% of the misspelled words in the corpus. Thus, a dictionary of 3482 words was manually created to correct this noise.</p>
        <p>Finally, 1 Twitter user appeared to likely be a bot by repeatedly posting 3 identical texts mentioning different users each time. It represented a total of 2343 tweets published in a very short period. This user was therefore deleted in order not to bias the results of the study.</p>
      </sec>
      <sec>
        <title>Model Building and Training</title>
        <p>After the preprocessing steps, an extended analysis to explore users’ sentiments about vaccination was initiated using advanced machine learning models. Some pretrained models in French can be adapted to a supervised classification task. We chose transfer learning, which allows learning with a limited amount of data or low computational capacity. Thus, as the model already has a sufficient understanding of the French language, it is not necessary to attain a large quantity of hand-labeled tweets.</p>
        <p>Most recent language models are based on the BERT model [<xref ref-type="bibr" rid="ref41">41</xref>]. As resources trained on tweets mentioning the COVID-19 pandemic are not available in French, it was necessary to fine tune existing models. Several pretrained models are available, with different sizes of architecture that are specific to one or more languages or that are trained on a particular type of text. To use these models for sentiment analysis, we chose to construct a classifier at the output of a BERT-type model to determine which of the classes was the most likely for each tweet. The BERT-type model chosen here was CamemBERT [<xref ref-type="bibr" rid="ref42">42</xref>], to which a linear classification layer was added. This linear layer learns the best multidimensional linear regression to perform on the output of the BERT-type model to obtain the desired predictions. Many other classification layers can be evaluated to improve performance. Moreover, this implies that the training is supervised.</p>
        <p>This study classified tweets into 3 categories: positive, negative, or neutral sentiment. Tweets labeled as positive mentioned the announced vaccine in an optimistic, confident way and often diffused encouraging news on the subject. The negative tweets evoked the potential vaccine in a mistrustful and possibly conspiratorial way, and they sought to warn of its possible risks or manipulation or to relay information spreading doubt about its effectiveness. The neutral ones were unrelated to vaccines or did not contain any judgment about them.</p>
        <p>For training, a total of 4548 tweets (4548/344,000, 1.3% of the restricted data set) were labeled by a single annotator, of which 26.9% (1223/4548) were negative, 21.2% (965/4548) were positive, and 51.9% (2360/4548) were neutral. The classification task was therefore imbalanced, and this had to be addressed by using specific methods. First, a stratified training method was required so that the training and test sets respected the proportion of each class. In order to compare methods, metrics must ensure that each class is best predicted not only as a whole but also class by class. Precision (ratio of predicted items that truly belong to this class) and recall (ratio of correctly predicted items among the known items of this class) were used to measure the performance of our method class by class, in addition to the <italic>F</italic><sub>1</sub>-score, which is their harmonic mean. Accuracy (ratio of correct predictions) is the metric used to give a general appreciation of the performance of the models. As a matter of performance comparison, a common sentiment classification model using a combination of term frequency-inverse document frequency (TF-IDF) and multinomial naïve Bayes was used.</p>
      </sec>
      <sec>
        <title>Implementation</title>
        <p>We used the following Python packages: sklearn, fastText, pytorch, pandas, kedro, and transformers. We used SSH access and Jupyter notebooks on a server consisting of a 28 core/56 thread microprocessor (Intel x64), 256 GB of memory, 1 TB of NVMe (nonvolatile memory express) storage, and 2 Nvidia GPUs of 2432 cuda core each (GeForce GTX 1070 Ti) with a Linux Debian 9.9 operating system (see the Acknowledgments section).</p>
      </sec>
      <sec>
        <title>Ethics Approval</title>
        <p>This study received approval from the ethics committee at the centre hospitalier universitaire de Saint-Etienne under the Institutional review board number 1412020/CHUSTE.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Data Collection Based on Word Embeddings</title>
        <p>The initial data set restricted to French tweets consisted of 894,315 unique words for 4,020,525 tweets. After training word embeddings for 300 dimensions, relations between words were explored, and 69 keywords were identified as the semantic concept of the word “vaccin.” The list of the 69 keywords and their translation in English are available in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        <p>Using PCA only as a visualization tool, we displayed a projection of the vector representations of each keyword on a shared 2D plan (<xref rid="figure2" ref-type="fig">Figure 2</xref>). This projection seems to group keywords into 3 groups surrounding the word “vaccin,” which could be summarized as potential treatments (top left; eg, antibiotique, antiviraux, artemisia, azithromycin, chloroquine, dexamethasone, hydroxychloroquine, plaquenil, remdesevir, and tocilizumab), conspiracy (bottom left), and pharmaceutical companies (right; eg, AstraZeneca, Gilead, GSK, Moderna, Novartis, Oxford, Pfizer, and Sanofi). The projection of the terms “vaccination” and “vacciner” (to vaccinate) sets these words among the words related to conspiracy theory terms like “charlatan” (charlatan), “cobaye” (guinea pig), “complot” (conspiracy), “conflit” (conflict), “conspiration” (conspiracy), “corrompu” (corrupt), “escroc” (crook), “intérêt” (interest), “lobby” (lobby), “mondialiste” (globalist), “puce” (chip), “théorie” (theory), and “traitre” (traitor), as well as mentions of Bill “Gates” and George “Soros.” Although “vaccination” and “vacciner” have the same root as “vaccin,” the embeddings captured nuances in their contexts. This information already unveils some polarity that is associated with the vocabulary.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>2D projection of the 69 identified keywords, with the starting word “vaccin” in red and “vaccination” and “vacciner” in blue for readability reasons, 3 hand-drawn ellipses highlighting sets of words present in the same area of the figure and showing that elements of a similar nature (eg, mistrust, drugs, or companies) can be grouped together. The addition of ellipses reflects only the interpretation of the authors and is not based on any mathematical theory.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Tweet filtering based on word embeddings provided a specific data set by restricting the collection to 344,000 tweets in French (around 9% of the initial French data set). Filtering based on the “vaccin” word alone would have generated a subset of 75,000 tweets, thus ignoring a large number of tweets potentially related to aspects of vaccine mistrust. The results presented in the rest of this paper concern the 344,000 French tweets related to a potential vaccine against COVID-19.</p>
      </sec>
      <sec>
        <title>Sentiment Analysis Model Evaluation</title>
        <p>To be able to compare the performance of a more complex model using CamemBERT and a linear layer classifier, it is necessary to evaluate very simple models and to know their performances. We chose 2 simple baseline models. Since the classes are very imbalanced in favor of the neutral class, the simplest model is to predict only this neutral class. This first baseline model had an accuracy of 0.52, and any other model must achieve better performances than this. The second baseline model was more meaningful while still being very simple. It combines a document embedding vectorization to TF-IDF features and a classifier named multinomial naïve Bayes. A document embedding is a vector representation of each document, according to the words of which it is composed. It is then used by the classifier to predict 1 of the 3 classes. After training, the metrics of this baseline are summarized in the following table (<xref ref-type="table" rid="table1">Table 1</xref>). Although the precision of the model in predicting a positive or a negative tweet was 0.89 and 0.74 respectively, the recall fell to 0.08 for the positive tweets and 0.53 for the negative tweets. Moreover, the prediction of the neutral class had a high recall of 0.94 but a low precision of 0.58 compared with the precision of positive and negative tweet predictions. Positive and negative tweets seemed to be misclassified into the neutral class, which therefore had a weaker precision. The confusion matrix confirmed those conclusions (<xref rid="figure3" ref-type="fig">Figure 3</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Classification summary for term frequency-inverse document frequency (TF-IDF) and multinomial naïve Bayes (MNB), as well as CamemBERT with the linear layer.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="130"/>
            <col width="80"/>
            <col width="210"/>
            <col width="0"/>
            <col width="90"/>
            <col width="200"/>
            <col width="0"/>
            <col width="80"/>
            <col width="210"/>
            <col width="0"/>
            <thead>
              <tr valign="top">
                <td>Classification</td>
                <td colspan="3">Precision</td>
                <td colspan="3">Recall</td>
                <td colspan="2"><italic>F</italic><sub>1</sub>-score</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MNB</td>
                <td>CamemBERT</td>
                <td colspan="2">MNB</td>
                <td>CamemBERT</td>
                <td colspan="2">MNB</td>
                <td colspan="2">CamemBERT</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Positive</td>
                <td>0.89</td>
                <td>0.64</td>
                <td colspan="2">0.08</td>
                <td>0.73</td>
                <td colspan="2">0.14</td>
                <td colspan="2">0.68</td>
              </tr>
              <tr valign="top">
                <td>Negative</td>
                <td>0.74</td>
                <td>0.75</td>
                <td colspan="2">0.53</td>
                <td>0.77</td>
                <td colspan="2">0.61</td>
                <td colspan="2">0.76</td>
              </tr>
              <tr valign="top">
                <td>Neutral</td>
                <td>0.58</td>
                <td>0.83</td>
                <td colspan="2">0.94</td>
                <td>0.75</td>
                <td colspan="2">0.71</td>
                <td colspan="2">0.78</td>
              </tr>
              <tr valign="top">
                <td>Macro-average</td>
                <td>0.73</td>
                <td>0.74</td>
                <td colspan="2">0.51</td>
                <td>0.75</td>
                <td colspan="2">0.49</td>
                <td colspan="2">0.74</td>
              </tr>
              <tr valign="top">
                <td>Micro-average</td>
                <td>0.70</td>
                <td>0.76</td>
                <td colspan="2">0.62</td>
                <td>0.75</td>
                <td colspan="2">0.56</td>
                <td colspan="2">0.75</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Confusion matrix for term frequency-inverse document frequency (TF-IDF) and multinomial naïve Bayes.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The performance of the sentiment analysis model proposed in this paper, which combines CamemBERT and a linear layer, is also summarized in <xref ref-type="table" rid="table1">Table 1</xref>. All <italic>F</italic><sub>1</sub>-scores are higher than those of the baseline. The proposed model therefore obtained fewer misclassifications for each class than the baseline. This conclusion is particularly visible for positive tweet predictions, for which there were fewer missed true positives (recall). Those results were also confirmed by the confusion matrix (<xref rid="figure4" ref-type="fig">Figure 4</xref>). However, the margin of error was still rather high, as the accuracy was only 0.75 compared with 0.62 for the multinomial naïve Bayes model. However, it is important to keep in mind the ambiguity of most tweets, whose annotation is subject to personal interpretation.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Confusion matrix for CamemBERT and a linear layer.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Characteristics of Vaccine Mistrust</title>
        <p>In order to summarize the information obtained from this classification, 2 representations were chosen: the temporal presentation of the tweet counts per class and the presentation of the most common words for each sentiment. As neutral tweets provide little information on the reasons for vaccine mistrust, the visualizations will only focus on the positive and negative tweets. <xref rid="figure5" ref-type="fig">Figure 5</xref> displays the counts of positive and negative tweets per day during the study period. Word embeddings using FastText allowed us to identify a broader range of arguments for vaccine mistrust. However, this method included more negative opinion than positive opinion, compared with the counts per day if only tweets containing the word “vaccin” were considered. The wider the vocabulary is, the weaker the signals of vaccine mistrust that are detected.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Counts of positive (blue) and negative (orange) tweets per day during the study period.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>It is thus possible to distinguish days with a higher activity than usual for both sentiments. We assumed that evaluation should focus on days when counts of tweets showing positive or negative sentiment showed a polarization of the users’ opinions, rather than days when the numbers of tweets were high but mostly neutral. As trends sometimes fluctuate a lot from one day to the next, there seemed to be temporary events of which users quickly take advantage.</p>
        <p>Simultaneously, it is possible to explore the most used vocabulary per sentiment. The following figures present the words (positive tweets in <xref rid="figure6" ref-type="fig">Figure 6</xref> and negative tweets in <xref rid="figure7" ref-type="fig">Figure 7</xref>) and bigrams (positive tweets in <xref rid="figure8" ref-type="fig">Figure 8</xref> and negative tweets in <xref rid="figure9" ref-type="fig">Figure 9</xref>) that were most frequent per sentiment. Discourses were more homogenous in the negative tweets, where they focused on alternative treatments (eg, “hydroxychloroquine”), political contestation of the government (eg, “désobéissance civile” [civil disobedience], “gilets jaunes” [yellow vests, named after the yellow high-visibility vests worn by protestors during a movement that emerged in France in October 2018]), and conspiracies (eg, “bill gates,” “boycott cac40”). “Raoult,” “chloroquine,” and “hydroxychloroquine” were the monograms the most discussed in negative tweets. “Didier Raoult” and “Professor Raoult” were the first and fourth bigrams, respectively, that were the most discussed in negative tweets.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Most frequent words for positive tweets.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Most frequent words for negative tweets.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Most frequent bigrams for positive tweets.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure9" position="float">
          <label>Figure 9</label>
          <caption>
            <p>Most frequent bigrams for negative tweets.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e37237_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Meanwhile, discussions about research advances were among the most common in the positive tweets. The most frequent positive terms focused on the efficiency or early results of the candidate vaccines (eg, “efficace contre” [effective against], “résultats encourageants” [encouraging results]). Nevertheless, positive tweets also communicated some terms like “chloroquine” that were mostly attributed to negative tweets.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Main Findings</title>
        <p>The objective of this study was to characterize the opinion of Twitter users on the subject of a potential vaccine against COVID-19. After a review of the literature in both the medical and machine learning domains, the chosen steps were to extract a set of relevant tweets, then to exploit them from a sentiment analysis perspective, and finally to explore these results. Using a vectorial vocabulary representation method proved to be a powerful way of broadening the lexical concept of vaccination during this pandemic. First, we implemented word embeddings using FastText and could identify 69 keywords representative of issues relative to vaccination against COVID-19. The relevance of these keywords was confirmed by their relative position on a PCA and their relation with news about COVID-19 in France (eg, a study questioning the use of chloroquine published then withdrawn from the Lancet or conspiratorial theses such as the participation of Bill Gates and 5G chips in vaccination campaigns with the aim of taking control of people).</p>
        <p>Second, we implemented a classifier based on CamemBERT, a French adaptation of BERT, a language model part of transformers with an <italic>F</italic><sub>1</sub>-score of 0.75 for predicting the opinion of Twitter users about potential vaccines against COVID-19. This allowed us to more precisely characterize tweets that presented positive or negative opinion on vaccination. We found that tweets with a negative opinion presented more polarized and political arguments than tweets with a positive opinion, and the role of treatments other than vaccines such as chloroquine was a major issue when discussing mistrust of vaccines.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>Most papers that evaluated tweets for extracting insights about vaccination against COVID-19 used an unsupervised approach, mainly topic models with latent Dirichlet allocation [<xref ref-type="bibr" rid="ref24">24</xref>], which means that a training set was not necessary. When sentiment analysis was performed, authors used a pretrained classifier most of the time, especially relying on Valence Aware Dictionary for Sentiment Reasoning (VADER) [<xref ref-type="bibr" rid="ref43">43</xref>], which is available in the NLTK Python library. Using a pretrained classifier expedites classification but presents the inconvenience that it is not specialized for the study domain. Transformers are currently acknowledged as presenting the best performances in several NLP tasks. Tweets are more difficult to classify due to their characteristics: They are limited to 280 characters but can be much shorter; they are not necessarily written with correct syntax; and they can contain abbreviations, misspellings, and slang words [<xref ref-type="bibr" rid="ref44">44</xref>]. We also observed that the results of predictions are generally significantly better for correctly written texts such as PubMed abstracts, than with tweets, for example [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
        <p>In previous work, several custom algorithms were proposed, such as (1) deep learning with a CamemBERT model [<xref ref-type="bibr" rid="ref28">28</xref>], BERT [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>], RoBERTa [<xref ref-type="bibr" rid="ref48">48</xref>], FastText [<xref ref-type="bibr" rid="ref49">49</xref>], convolutional neural network–long short-term memory with word2vec embeddings [<xref ref-type="bibr" rid="ref50">50</xref>] or (2) machine learning with naïve Bayes [<xref ref-type="bibr" rid="ref51">51</xref>] or decision tree [<xref ref-type="bibr" rid="ref52">52</xref>] models. Off-the-shelf sentiment analysis models include Amazon Web Services Comprehend sentiment analysis [<xref ref-type="bibr" rid="ref53">53</xref>] and VADER [<xref ref-type="bibr" rid="ref54">54</xref>-<xref ref-type="bibr" rid="ref60">60</xref>], which is a Python lexicon and rule-based sentiment analysis tool [<xref ref-type="bibr" rid="ref43">43</xref>]. In a recent evaluation of 11 sentiment analysis tools on 7 social media data sets, He et al [<xref ref-type="bibr" rid="ref61">61</xref>] observed that these tools do not provide results that are accurate enough to aid in public health decision-making. Among all tools, VADER was one of the 3 top performers.</p>
        <p>Our <italic>F</italic>1-score was 0.75, but it is at the same level as the best scores obtained in other papers in which this score is available. Some papers provided only partial results that did not allow a comparison, and most provided no metrics for the classifier. Li et al [<xref ref-type="bibr" rid="ref55">55</xref>] obtained <italic>F</italic><sub>1</sub>-scores of 0.76 for “unrelated” (class 0), 0.50 for “positive” (class 1), and 0.37 for “negative” (class –1), which means that we obtained better results if we consider the average of the scores of the 3 classes. Mønsted and Lehmann [<xref ref-type="bibr" rid="ref49">49</xref>] obtained a micro-averaged <italic>F</italic><sub>1</sub>-score of 0.762 for a 3-class prediction, which is a good result considering that the authors used Amazon’s Mechanical Turk platform. Sauvayre et al [<xref ref-type="bibr" rid="ref28">28</xref>] classified tweets according to the opinion for or against users and obtained an accuracy of 0.706 using a fine-tuned CamemBERT prediction model with 2 classes, whereas we used 3 classes, which is more unfavorable. Kummervold et al [<xref ref-type="bibr" rid="ref46">46</xref>] obtained an <italic>F</italic><sub>1</sub>-score of 0.78 to predict the attitude of pregnant women toward vaccination against COVID-19, but the categories for the classification were different. Portelli et al [<xref ref-type="bibr" rid="ref48">48</xref>] used a RoBERTa model trained on TweetEval Benchmark. However, the authors only provided the recall for sentiment analysis, which was 72.1, and not the precision, which does not allow a comparison with our results.</p>
        <p>To improve our results, we propose using multitask training or pretrained embeddings. Multitask learning may improve results in some cases, but it is not systematic. This confirms that data science is an empirical discipline in which only experiments make it possible to determine the most appropriate approach in a defined context and that there is no method that makes it possible to confidently improve the results. In some cases, multitask learning made it possible to improve the results [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]. However, previous studies, such as that by Rodriguez et al [<xref ref-type="bibr" rid="ref64">64</xref>], observed that multitask learning did not improve the results in general. However, it was possible to train the model on a simple task using transfer learning from the multitask model, obtaining better performance using less data. For the detection of fake news on COVID-19, Malla and Alphonse [<xref ref-type="bibr" rid="ref65">65</xref>] showed how it could be interesting to use a CT-BERT (COVID-Twitter-BERT) model [<xref ref-type="bibr" rid="ref25">25</xref>] but not a BERTweet model [<xref ref-type="bibr" rid="ref66">66</xref>]. In 2020, Lee et al [<xref ref-type="bibr" rid="ref67">67</xref>] proposed BioBERT, a language model pretrained on PubMed abstracts and PubMed Central full-text articles, that largely outperformed BERT for biomedical NLP tasks. Similarly, Med-BERT, a pretrained model on a structured electronic health record data set of 28,490,650 patients [<xref ref-type="bibr" rid="ref68">68</xref>], allows working with smaller training sets while obtaining better performance.</p>
        <p>In this study, we used Twitter rather than other social media platforms such as Facebook or Reddit. In fact, Wawrzuta et al [<xref ref-type="bibr" rid="ref69">69</xref>] suggested that Facebook is more appropriate when evaluating public opinion because it has more active users compared with Twitter and Instagram and it is more representative of society’s demography than Twitter and Instagram, on which young city dwellers with a good level of education are overrepresented. However, Facebook does not provide an API allowing it to extract posts based on keywords. This is why it is necessary to clearly define and identify the discussion groups on which the study will focus [<xref ref-type="bibr" rid="ref70">70</xref>]. Furthermore, it can be assumed that a poor selection of these groups could lead to biases when interpreting the data. One of the interests with Reddit, a discussion forum, is that it is divided into subreddits for which one can have an overview of the posts that relate to a place or a particular topic. This is not the case with Twitter on which the discussions concern rather a vast community and do not make it possible to know the specifics of the discussions in regional communities [<xref ref-type="bibr" rid="ref71">71</xref>].</p>
      </sec>
      <sec>
        <title>Tweet Content Analysis</title>
        <p>Throughout the health crisis, the media maintained a high level of attention on treatments against COVID-19. For example, Professor Didier Raoult, an internationally renowned French microbiologist [<xref ref-type="bibr" rid="ref72">72</xref>], presented a study from the Institut Hospitalier Universitaire de Marseille, in which a treatment combining hydroxychloroquine and azithromycin made it possible to significantly decrease the viral load in patients with COVID-19 [<xref ref-type="bibr" rid="ref73">73</xref>]. Part of the population was then doubtful of the reasons why health authorities did not authorize using these drugs. Believing that some therapeutic means are highly efficient at curing the disease makes it less desirable to apply preventive measures, which might have affected the perception of potential vaccines against COVID-19. The neighborhood of “hydroxychloroquine,” “vaccination,” and “Raoult” observed with the PCA in <xref rid="figure2" ref-type="fig">Figure 2</xref> confirms our assumption that the perception of vaccines should be considered in relation to the perception of hydroxychloroquine. Additionally, a large portion of negative posts identified with our classifier mentioned chloroquine or hydroxychloroquine or tweets about Didier Raoult. However, PCA does not allow the evaluation of whether believing a treatment is efficient for quick healing may influence the intention of individuals to protect themselves, because the proximity relations on the PCA are not categorized. Nevertheless, further experiments with data from more recent time periods could help to determine if such relations should also be considered between vaccines and other presumed treatments such as ivermectin [<xref ref-type="bibr" rid="ref74">74</xref>] or azithromycin [<xref ref-type="bibr" rid="ref75">75</xref>]. As we found pharmaceutical companies that are only relevant to the vaccine or the COVID-19 crisis (eg, Gilead proposing an alternative treatment) and not others, we can assume that we applied a successful keyword selection strategy able to select relevant keywords. Our analysis revealed the dominant discourses and weak signals of vaccine mistrust.</p>
        <p>After annotating a subset of tweets, an efficient classification implementing the state-of-the-art of NLP was able to reveal temporal trends in sentiment about potential vaccination against COVID-19. Moreover, further explorations of the vocabulary gave a different view of vaccine mistrust arguments.</p>
        <p>Hence, there appears to be a change in the profile of Twitter users on this issue. According to Massey et al [<xref ref-type="bibr" rid="ref76">76</xref>], Twitter seemed to be used more by profiles confident in the HPV vaccine, whereas our study showed a greater sharing of opposition against the announced COVID-19 vaccine, notably driven by political mistrust. Skepticism already observed with other vaccines could influence people who remain uncertain about vaccination because of the large audience that distrustful tweets have.</p>
        <p>These observations may help the regulatory authorities to disseminate credible information by providing clear, precise communication around a potential campaign. The success of a vaccination campaign depends not only on sufficient coverage of the population to obtain collective immunity but also, and above all, on the acceptance of such a campaign by the same population. This study tends to clarify reasons for vaccine mistrust based on users’ reactions on social media.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The main limitation is that the annotation was performed by a single annotator. Additional experiments involving additional annotators have shown that annotations can be different in a very large number of tweets. This certainly reflects significant subjectivity related to the interpretation of the content of tweets in the chosen field. It would be interesting to take into account the role of emoticons in tweets because they can possibly help to better interpret the content, especially in the case of ironic content that we risk taking at face value.</p>
        <p>This study focused on exploiting the textual information of Twitter but did not extract any further metadata such as users’ information. However, a preliminary experiment that we conducted earlier showed that medical professionals seem to be excluded from the debate on Twitter, except for a few personalities who are against a potential vaccine. This could lead to a better understanding of the observed dynamics.</p>
        <p>Another limitation rests on the performances of the sentiment analysis. The model could achieve better performances in the near future with better parameter optimization and further exploration of other approaches. Models that are unsupervised like zero-shot learning could be interesting for additional investigation. Finally, it is important to emphasize that this study is not representative of neither the French population nor Twitter users in general.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>We proposed an approach that allows the selection of keywords using word embeddings with FastText and obtain a visual representation according to their closeness to one another with PCA. Then, we implemented a classifier using BERT that allows the prediction of the opinion on COVID-19 vaccines by Twitter users. Our study showed that Twitter could be a useful tool to investigate the arguments around vaccine mistrust (eg, the role of 5G in vaccination and discussions about other treatments such as chloroquine). Our results unveil that political aspects of vaccination overshadow its usual criticisms about adverse drug reactions. As the opposition rhetoric is generally more homogenous and more widely spread than the positive rhetoric, we believe that this study provides effective tools to help health authorities better understand vaccine mistrust.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>List of 24 word pairs in French used for the Discounted Cumulative Gain (DCG).</p>
        <media xlink:href="jmir_v25i1e37237_app1.docx" xlink:title="DOCX File , 28 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>List of the 69 selected keywords.</p>
        <media xlink:href="jmir_v25i1e37237_app2.docx" xlink:title="DOCX File , 35 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">DCG</term>
          <def>
            <p>Discounted Cumulative Gain</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">HPV</term>
          <def>
            <p>human papillomavirus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">PCA</term>
          <def>
            <p>principal component analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">TF-IDF</term>
          <def>
            <p>term frequency-inverse document frequency</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">VADER</term>
          <def>
            <p>Valence Aware Dictionary for Sentiment Reasoning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was funded by grant number ANR-16-CE23-0011-01 from the French Agence nationale de la Recherche (ANR) through the Pharmacovigilance enrichie par des Groupements Améliorant la detection des Signaux Emergents (PEGASE) project. Exaion, a new subsidiary of the Électricité de France group, a cloud provider of blockchain and high-performance computing solutions, lent one of its servers with 2 graphical processing units free of charge for the duration of the study. We thank the representatives of Exaion for providing technical support for this server: Fatih Balyeli, Laurent Bernou-Mazars, Nicolas Meaux, and Vivien Sayve. Exaion never intervened in the conduct nor interpretation of the study. We acknowledge the work of the Panacea Lab in collecting tweets related to the COVID-19 pandemic. The views mentioned in this article are those of the authors only.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The original data set providing the tweets’ IDs can be found on the Panacea Lab GitHub site [<xref ref-type="bibr" rid="ref77">77</xref>]. The code is available at [<xref ref-type="bibr" rid="ref78">78</xref>], and the annotated training set is available on request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>ADZ implemented the embeddings and the classifier and performed the analysis. BA collected data from the Panacea Lab GitHub repository and extracted tweets from Twitter, administered the server, and installed the necessary libraries and tools. ADZ and CB drafted the manuscript. CD and CG defined the rules for classifying tweets. AGB provided support on designing the study and reviewing results. All coauthors revised the article critically for important intellectual content and provided final approval of the version to be submitted.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>MacDonald</surname>
              <given-names>NE</given-names>
            </name>
            <collab>SAGE Working Group on Vaccine Hesitancy</collab>
          </person-group>
          <article-title>Vaccine hesitancy: Definition, scope and determinants</article-title>
          <source>Vaccine</source>
          <year>2015</year>
          <month>08</month>
          <day>14</day>
          <volume>33</volume>
          <issue>34</issue>
          <fpage>4161</fpage>
          <lpage>4</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0264-410X(15)00500-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2015.04.036</pub-id>
          <pub-id pub-id-type="medline">25896383</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(15)00500-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Alleaume</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Peretti-Watel</surname>
              <given-names>P</given-names>
            </name>
            <collab>COCONEL Group</collab>
          </person-group>
          <article-title>The French public's attitudes to a future COVID-19 vaccine: The politicization of a public health issue</article-title>
          <source>Soc Sci Med</source>
          <year>2020</year>
          <month>11</month>
          <volume>265</volume>
          <fpage>113414</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33038683"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.socscimed.2020.113414</pub-id>
          <pub-id pub-id-type="medline">33038683</pub-id>
          <pub-id pub-id-type="pii">S0277-9536(20)30633-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7537647</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wakefield</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Anthony</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Linnell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Casson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Malik</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Berelowitz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dhillon</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thomson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Valentine</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Walker-Smith</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Ileal-lymphoid-nodular hyperplasia, non-specific colitis, and pervasive developmental disorder in children</article-title>
          <source>Lancet</source>
          <year>1998</year>
          <month>02</month>
          <day>28</day>
          <volume>351</volume>
          <issue>9103</issue>
          <fpage>637</fpage>
          <lpage>41</lpage>
          <pub-id pub-id-type="doi">10.1016/s0140-6736(97)11096-0</pub-id>
          <pub-id pub-id-type="medline">9500320</pub-id>
          <pub-id pub-id-type="pii">S0140673697110960</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deer</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>How the case against the MMR vaccine was fixed</article-title>
          <source>BMJ</source>
          <year>2011</year>
          <month>01</month>
          <day>05</day>
          <volume>342</volume>
          <issue>jan05 1</issue>
          <fpage>c5347</fpage>
          <lpage>c5347</lpage>
          <pub-id pub-id-type="doi">10.1136/bmj.c5347</pub-id>
          <pub-id pub-id-type="medline">21209059</pub-id>
          <pub-id pub-id-type="pii">bmj.c5347</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peretti-Watel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Seror</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Cortaredona</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Launay</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Raude</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Verger</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fressard</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Beck</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Legleye</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>L'Haridon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Léger</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>JK</given-names>
            </name>
          </person-group>
          <article-title>A future vaccination campaign against COVID-19 at risk of vaccine hesitancy and politicisation</article-title>
          <source>The Lancet Infectious Diseases</source>
          <year>2020</year>
          <month>07</month>
          <volume>20</volume>
          <issue>7</issue>
          <fpage>769</fpage>
          <lpage>770</lpage>
          <pub-id pub-id-type="doi">10.1016/s1473-3099(20)30426-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Detoc</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bruel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Frappe</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tardy</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Botelho-Nevers</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gagneux-Brunon</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Intention to participate in a COVID-19 vaccine clinical trial and to get vaccinated against COVID-19 in France during the pandemic</article-title>
          <source>Vaccine</source>
          <year>2020</year>
          <month>10</month>
          <day>21</day>
          <volume>38</volume>
          <issue>45</issue>
          <fpage>7002</fpage>
          <lpage>7006</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32988688"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2020.09.041</pub-id>
          <pub-id pub-id-type="medline">32988688</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(20)31201-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7498238</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Global Attitudes on a COVID-19 Vaccine</article-title>
          <source>IPSOS</source>
          <year>2020</year>
          <access-date>2023-02-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ipsos.com/sites/default/files/ct/news/documents/2020-11/global-attitudes-on-a-covid-19-vaccine-oct-2020.pdf">https://www.ipsos.com/sites/default/files/ct/news/documents/2020-11/global-attitudes-on-a-covid-19-vaccine-oct-2020.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lazarus</surname>
              <given-names>JV</given-names>
            </name>
            <name name-style="western">
              <surname>Ratzan</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Palayew</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gostin</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rabin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kimball</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>El-Mohandes</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A global survey of potential acceptance of a COVID-19 vaccine</article-title>
          <source>Nat Med</source>
          <year>2021</year>
          <month>02</month>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>225</fpage>
          <lpage>228</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33082575"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41591-020-1124-9</pub-id>
          <pub-id pub-id-type="medline">33082575</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-020-1124-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7573523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neumann-Böhme</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Varghese</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Sabat</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Barros</surname>
              <given-names>PP</given-names>
            </name>
            <name name-style="western">
              <surname>Brouwer</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>van Exel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schreyögg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stargardt</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Once we have it, will we use it? A European survey on willingness to be vaccinated against COVID-19</article-title>
          <source>Eur J Health Econ</source>
          <year>2020</year>
          <month>09</month>
          <day>26</day>
          <volume>21</volume>
          <issue>7</issue>
          <fpage>977</fpage>
          <lpage>982</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32591957"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10198-020-01208-6</pub-id>
          <pub-id pub-id-type="medline">32591957</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10198-020-01208-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7317261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Loe</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chadwick</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vaccari</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shanyinde</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Waite</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rosebrock</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Petit</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderslott</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lewandowsky</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Larkin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Innocenti</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>McShane</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lambe</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Effects of different types of written vaccination information on COVID-19 vaccine hesitancy in the UK (OCEANS-III): a single-blind, parallel-group, randomised controlled trial</article-title>
          <source>The Lancet Public Health</source>
          <year>2021</year>
          <month>06</month>
          <volume>6</volume>
          <issue>6</issue>
          <fpage>e416</fpage>
          <lpage>e427</lpage>
          <pub-id pub-id-type="doi">10.1016/s2468-2667(21)00096-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Public Opinions towards COVID-19 in California and New York on Twitter</article-title>
          <source>medRxiv. Preprint posted online July 14, 2020</source>
          <pub-id pub-id-type="doi">10.1101/2020.07.12.20151936</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zimet</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A natural language processing framework to analyse the opinions on HPV vaccination reflected in twitter over 10 years (2008 - 2017)</article-title>
          <source>Human Vaccines &#38; Immunotherapeutics</source>
          <year>2019</year>
          <month>07</month>
          <day>16</day>
          <volume>15</volume>
          <issue>7-8</issue>
          <fpage>1496</fpage>
          <lpage>1504</lpage>
          <pub-id pub-id-type="doi">10.1080/21645515.2019.1627821</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sha</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Al Hasan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mohler</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Brantingham</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Dynamic topic modeling of the COVID-19 Twitter narrative among U.S. governors and cabinet executives</article-title>
          <source>arXiv. Preprint posted online April 19, 2020</source>
          <pub-id pub-id-type="doi">10.48550/arXiv.2004.11692</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daughton</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Shelley</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Barnard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gerts</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Watson Ross</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Crooker</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nadiga</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mukundan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Vaquera Chavez</surname>
              <given-names>NY</given-names>
            </name>
            <name name-style="western">
              <surname>Parikh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pitts</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fairchild</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Mining and validating social media data for COVID-19-related human behaviors between January and July 2020: infodemiology study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>05</month>
          <day>25</day>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>e27059</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/5/e27059/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/27059</pub-id>
          <pub-id pub-id-type="medline">33882015</pub-id>
          <pub-id pub-id-type="pii">v23i5e27059</pub-id>
          <pub-id pub-id-type="pmcid">PMC8153035</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Janies</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A novel machine learning framework for comparison of viral COVID-19-related Sina Weibo and Twitter posts: workflow development and content analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>01</month>
          <day>06</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>e24889</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/1/e24889/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24889</pub-id>
          <pub-id pub-id-type="medline">33326408</pub-id>
          <pub-id pub-id-type="pii">v23i1e24889</pub-id>
          <pub-id pub-id-type="pmcid">PMC7790734</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adikari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nawaratne</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>De Silva</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ranasinghe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Alahakoon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Alahakoon</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Emotions of COVID-19: content analysis of self-reported information using artificial intelligence</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>04</month>
          <day>30</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>e27341</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/4/e27341/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/27341</pub-id>
          <pub-id pub-id-type="medline">33819167</pub-id>
          <pub-id pub-id-type="pii">v23i4e27341</pub-id>
          <pub-id pub-id-type="pmcid">PMC8092030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Quinn</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Hancock</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Freimuth</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Jamison</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Social media use and influenza vaccine uptake among White and African American adults</article-title>
          <source>Vaccine</source>
          <year>2018</year>
          <month>11</month>
          <day>26</day>
          <volume>36</volume>
          <issue>49</issue>
          <fpage>7556</fpage>
          <lpage>7561</lpage>
          <pub-id pub-id-type="doi">10.1016/j.vaccine.2018.10.049</pub-id>
          <pub-id pub-id-type="medline">30389192</pub-id>
          <pub-id pub-id-type="pii">S0264-410X(18)31415-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wawrzuta</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jaworski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gotlib</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Panczyk</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Characteristics of antivaccine messages on social media: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>06</month>
          <day>04</day>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>e24564</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/6/e24564/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24564</pub-id>
          <pub-id pub-id-type="medline">34085943</pub-id>
          <pub-id pub-id-type="pii">v23i6e24564</pub-id>
          <pub-id pub-id-type="pmcid">PMC8214178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Kearney</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Hauer</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Selvan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Koku</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Leader</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Dimensions of misinformation about the HPV vaccine on Instagram: content and network analysis of social media characteristics</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>12</month>
          <day>03</day>
          <volume>22</volume>
          <issue>12</issue>
          <fpage>e21451</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/12/e21451/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21451</pub-id>
          <pub-id pub-id-type="medline">33270038</pub-id>
          <pub-id pub-id-type="pii">v22i12e21451</pub-id>
          <pub-id pub-id-type="pmcid">PMC7746500</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Skeppstedt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kerren</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stede</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Vaccine Hesitancy in Discussion Forums: Computer-Assisted Argument Mining with Topic Models</article-title>
          <source>The Communication Initiative Network</source>
          <year>2018</year>
          <month>06</month>
          <day>15</day>
          <access-date>2023-02-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.comminit.com/content/vaccine-hesitancy-discussion-forums-computer-assisted-argument-mining-topic-models">https://www.comminit.com/content/vaccine-hesitancy-discussion-forums-computer-assisted-argument-mining-topic-models</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cong</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Sentiment analysis methods for HPV vaccines related tweets based on transfer learning</article-title>
          <source>Healthcare (Basel)</source>
          <year>2020</year>
          <month>08</month>
          <day>28</day>
          <volume>8</volume>
          <issue>3</issue>
          <fpage>307</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare8030307"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare8030307</pub-id>
          <pub-id pub-id-type="medline">32872330</pub-id>
          <pub-id pub-id-type="pii">healthcare8030307</pub-id>
          <pub-id pub-id-type="pmcid">PMC7551482</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tahir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gogate</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dashtipour</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-enabled analysis of public attitudes on Facebook and Twitter toward COVID-19 vaccines in the United Kingdom and the United States: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>04</month>
          <day>05</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>e26627</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/4/e26627/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26627</pub-id>
          <pub-id pub-id-type="medline">33724919</pub-id>
          <pub-id pub-id-type="pii">v23i4e26627</pub-id>
          <pub-id pub-id-type="pmcid">PMC8023383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kwok</surname>
              <given-names>SWH</given-names>
            </name>
            <name name-style="western">
              <surname>Vadde</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Tweet topics and sentiments relating to COVID-19 vaccination among Australian Twitter users: machine learning analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>05</month>
          <day>19</day>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>e26953</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/5/e26953/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26953</pub-id>
          <pub-id pub-id-type="medline">33886492</pub-id>
          <pub-id pub-id-type="pii">v23i5e26953</pub-id>
          <pub-id pub-id-type="pmcid">PMC8136408</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>Journal of Machine Learning Research</source>
          <year>2003</year>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume3/blei03a/blei03a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Salathé</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kummervold</surname>
              <given-names>PE</given-names>
            </name>
          </person-group>
          <article-title>COVID-Twitter-BERT: a natural language processing model to analyse COVID-19 content on Twitter</article-title>
          <source>arXiv. Preprint posted online May 15, 2020</source>
          <pub-id pub-id-type="doi">10.48550/arXiv.2005.07503</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arnaud</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elbattah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gignon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dequen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Learning embeddings from free-text triage notes using pretrained transformer models</article-title>
          <source>HEALTHINF: Proceedings of the 15th International Joint Conference on Biomedical Engineering Systems and Technologies</source>
          <year>2022</year>
          <volume>5</volume>
          <fpage>835</fpage>
          <lpage>841</lpage>
          <pub-id pub-id-type="doi">10.5220/0011012800003123</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blanc</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bailly</surname>
              <given-names>A</given-names>
            </name>
            <collab>Francis</collab>
            <name name-style="western">
              <surname>Guillotin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jamal</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wakim</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>FlauBERT vs. CamemBERT: Understanding patient's answers by a French medical chatbot</article-title>
          <source>Artif Intell Med</source>
          <year>2022</year>
          <month>05</month>
          <volume>127</volume>
          <fpage>102264</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0933-3657(22)00029-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2022.102264</pub-id>
          <pub-id pub-id-type="medline">35430035</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(22)00029-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sauvayre</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Vernier</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chauvière</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>An analysis of French-language tweets about COVID-19 vaccines: supervised learning approach</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>05</month>
          <day>17</day>
          <volume>10</volume>
          <issue>5</issue>
          <fpage>e37831</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/5/e37831/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37831</pub-id>
          <pub-id pub-id-type="medline">35512274</pub-id>
          <pub-id pub-id-type="pii">v10i5e37831</pub-id>
          <pub-id pub-id-type="pmcid">PMC9116457</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <article-title>Ten threats to global health in 2019</article-title>
          <source>World Health Organization</source>
          <access-date>2021-06-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/spotlight/ten-threats-to-global-health-in-2019">https://www.who.int/news-room/spotlight/ten-threats-to-global-health-in-2019</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Landry</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Paluszek</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Groenewoud</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rachor</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Asmundson</surname>
              <given-names>GJG</given-names>
            </name>
          </person-group>
          <article-title>A proactive approach for managing COVID-19: the importance of understanding the motivational roots of vaccination hesitancy for SARS-CoV2</article-title>
          <source>Front Psychol</source>
          <year>2020</year>
          <month>10</month>
          <day>19</day>
          <volume>11</volume>
          <fpage>575950</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33192883"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyg.2020.575950</pub-id>
          <pub-id pub-id-type="medline">33192883</pub-id>
          <pub-id pub-id-type="pmcid">PMC7604422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jolley</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Douglas</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>The effects of anti-vaccine conspiracy theories on vaccination intentions</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <month>2</month>
          <day>20</day>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>e89177</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0089177"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0089177</pub-id>
          <pub-id pub-id-type="medline">24586574</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-38770</pub-id>
          <pub-id pub-id-type="pmcid">PMC3930676</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shahsavari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Holur</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tangherlini</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Roychowdhury</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Conspiracy in the time of corona: automatic detection of emerging COVID-19 conspiracy theories in social media and the news</article-title>
          <source>J Comput Soc Sci</source>
          <year>2020</year>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>279</fpage>
          <lpage>317</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33134595"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s42001-020-00086-5</pub-id>
          <pub-id pub-id-type="medline">33134595</pub-id>
          <pub-id pub-id-type="pii">86</pub-id>
          <pub-id pub-id-type="pmcid">PMC7591696</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Audureau</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Anti-vaccine discourse, well established in France, has redoubled its vigor with the health crisis</article-title>
          <source>Le Monde</source>
          <year>2020</year>
          <month>06</month>
          <day>10</day>
          <access-date>2021-08-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.lemonde.fr/les-decodeurs/article/2020/06/10/pour-les-antivaccins-les-deux-themes-dominants-sont-big-brother-et-big-pharma_6042339_4355770.html">https://www.lemonde.fr/les-decodeurs/article/2020/06/10/pour-les-antivaccins-les-deux-themes-dominants-sont-big-brother-et-big-pharma_6042339_4355770.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehra</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Ruschitzka</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>AN</given-names>
            </name>
          </person-group>
          <article-title>RETRACTED: Hydroxychloroquine or chloroquine with or without a macrolide for treatment of COVID-19: a multinational registry analysis</article-title>
          <source>The Lancet</source>
          <year>2020</year>
          <month>5</month>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.1016/s0140-6736(20)31180-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehra</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Kuy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>AN</given-names>
            </name>
          </person-group>
          <article-title>Retraction: cardiovascular disease, drug therapy, and mortality in Covid-19</article-title>
          <source>N Engl J Med</source>
          <year>2020</year>
          <month>06</month>
          <day>25</day>
          <volume>382</volume>
          <issue>26</issue>
          <fpage>2582</fpage>
          <lpage>2582</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmc2021225</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vosoughi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Aral</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The spread of true and false news online</article-title>
          <source>Science</source>
          <year>2018</year>
          <month>03</month>
          <day>09</day>
          <volume>359</volume>
          <issue>6380</issue>
          <fpage>1146</fpage>
          <lpage>1151</lpage>
          <pub-id pub-id-type="doi">10.1126/science.aap9559</pub-id>
          <pub-id pub-id-type="medline">29590045</pub-id>
          <pub-id pub-id-type="pii">359/6380/1146</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>The Lancet Infectious Diseases</collab>
          </person-group>
          <article-title>The COVID-19 infodemic</article-title>
          <source>The Lancet Infectious Diseases</source>
          <year>2020</year>
          <month>08</month>
          <volume>20</volume>
          <issue>8</issue>
          <fpage>875</fpage>
          <pub-id pub-id-type="doi">10.1016/s1473-3099(20)30565-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burki</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The online anti-vaccine movement in the age of COVID-19</article-title>
          <source>The Lancet Digital Health</source>
          <year>2020</year>
          <month>10</month>
          <volume>2</volume>
          <issue>10</issue>
          <fpage>e504</fpage>
          <lpage>e505</lpage>
          <pub-id pub-id-type="doi">10.1016/s2589-7500(20)30227-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grimes</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Health disinformation &#38; social media: The crucial role of information hygiene in mitigating conspiracy theory and infodemics</article-title>
          <source>EMBO Rep</source>
          <year>2020</year>
          <month>11</month>
          <day>05</day>
          <volume>21</volume>
          <issue>11</issue>
          <fpage>e51819</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33155436"/>
          </comment>
          <pub-id pub-id-type="doi">10.15252/embr.202051819</pub-id>
          <pub-id pub-id-type="medline">33155436</pub-id>
          <pub-id pub-id-type="pmcid">PMC7645170</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Banda</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Tekumalla</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Artemova</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Tutubalina</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chowell</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A large-scale COVID-19 Twitter chatter dataset for open scientific research-an international collaboration</article-title>
          <source>Epidemiologia (Basel)</source>
          <year>2021</year>
          <month>08</month>
          <day>05</day>
          <volume>2</volume>
          <issue>3</issue>
          <fpage>315</fpage>
          <lpage>324</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=epidemiologia2030024"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/epidemiologia2030024</pub-id>
          <pub-id pub-id-type="medline">36417228</pub-id>
          <pub-id pub-id-type="pii">epidemiologia2030024</pub-id>
          <pub-id pub-id-type="pmcid">PMC9620940</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep Bidirectional Transformers for language understanding</article-title>
          <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)</source>
          <year>2019</year>
          <fpage>4171</fpage>
          <lpage>4186</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Muller</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Suárez</surname>
              <given-names>PJO</given-names>
            </name>
            <name name-style="western">
              <surname>Dupont</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Romary</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>de la Clergerie</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Seddah</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sagot</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>CamemBERT: a tasty French language model</article-title>
          <source>arXiv. Preprint posted online May 21, 2020</source>
          <pub-id pub-id-type="doi">10.18653/v1/2020.acl-main.645</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hutto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>VADER: a parsimonious rule-based model for sentiment analysis of social media text</article-title>
          <source>Proceedings of the International AAAI Conference on Web and Social Media</source>
          <year>2014</year>
          <month>05</month>
          <day>16</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>216</fpage>
          <lpage>225</lpage>
          <pub-id pub-id-type="doi">10.1609/icwsm.v8i1.14550</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Colditz</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>O'Halloran</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Taneja</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Welling</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sidani</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Primack</surname>
              <given-names>BA</given-names>
            </name>
          </person-group>
          <article-title>Machine learning classifiers for Twitter surveillance of vaping: comparative machine learning study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>08</month>
          <day>12</day>
          <volume>22</volume>
          <issue>8</issue>
          <fpage>e17478</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/8/e17478/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17478</pub-id>
          <pub-id pub-id-type="medline">32784184</pub-id>
          <pub-id pub-id-type="pii">v22i8e17478</pub-id>
          <pub-id pub-id-type="pmcid">PMC7450367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Saeed</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Iltaf</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Umair</surname>
              <given-names>MY</given-names>
            </name>
          </person-group>
          <article-title>Pharmacovigilance with transformers: a framework to detect adverse drug reactions using BERT fine-tuned with FARM</article-title>
          <source>Comput Math Methods Med</source>
          <year>2021</year>
          <month>8</month>
          <day>13</day>
          <volume>2021</volume>
          <fpage>5589829</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2021/5589829"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2021/5589829</pub-id>
          <pub-id pub-id-type="medline">34422092</pub-id>
          <pub-id pub-id-type="pmcid">PMC8378963</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kummervold</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dada</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kilich</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Paterson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>HJ</given-names>
            </name>
          </person-group>
          <article-title>Categorizing vaccine confidence with a transformer-based machine learning model: analysis of nuances of vaccine sentiment in Twitter discourse</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>10</month>
          <day>08</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>e29584</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/10/e29584/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29584</pub-id>
          <pub-id pub-id-type="medline">34623312</pub-id>
          <pub-id pub-id-type="pii">v9i10e29584</pub-id>
          <pub-id pub-id-type="pmcid">PMC8538052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Monselise</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <article-title>Topics and sentiments of public concerns regarding COVID-19 vaccines: social media trend analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>10</month>
          <day>21</day>
          <volume>23</volume>
          <issue>10</issue>
          <fpage>e30765</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/10/e30765/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30765</pub-id>
          <pub-id pub-id-type="medline">34581682</pub-id>
          <pub-id pub-id-type="pii">v23i10e30765</pub-id>
          <pub-id pub-id-type="pmcid">PMC8534488</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Portelli</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Scaboro</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tonino</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chersoni</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Santus</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Serra</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Monitoring user opinions and side effects on COVID-19 vaccines in the Twittersphere: infodemiology study of tweets</article-title>
          <source>J Med Internet Res</source>
          <year>2022</year>
          <month>05</month>
          <day>13</day>
          <volume>24</volume>
          <issue>5</issue>
          <fpage>e35115</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2022/5/e35115/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/35115</pub-id>
          <pub-id pub-id-type="medline">35446781</pub-id>
          <pub-id pub-id-type="pii">v24i5e35115</pub-id>
          <pub-id pub-id-type="pmcid">PMC9132143</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mønsted</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lehmann</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Characterizing polarization in online vaccine discourse-A large-scale study</article-title>
          <source>PLoS One</source>
          <year>2022</year>
          <month>2</month>
          <day>9</day>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>e0263746</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0263746"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0263746</pub-id>
          <pub-id pub-id-type="medline">35139121</pub-id>
          <pub-id pub-id-type="pii">PONE-D-21-27127</pub-id>
          <pub-id pub-id-type="pmcid">PMC8827439</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bokaee Nezhad</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Deihimi</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Twitter sentiment analysis from Iran about COVID 19 vaccine</article-title>
          <source>Diabetes Metab Syndr</source>
          <year>2022</year>
          <month>01</month>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>102367</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34933273"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dsx.2021.102367</pub-id>
          <pub-id pub-id-type="medline">34933273</pub-id>
          <pub-id pub-id-type="pii">S1871-4021(21)00387-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8667351</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahmanti</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Chien</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nursetyo</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Husnayain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wiratama</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Fuad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>YJ</given-names>
            </name>
          </person-group>
          <article-title>Social media sentiment analysis to monitor the performance of vaccination coverage during the early phase of the national COVID-19 vaccine rollout</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2022</year>
          <month>06</month>
          <volume>221</volume>
          <fpage>106838</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35567863"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2022.106838</pub-id>
          <pub-id pub-id-type="medline">35567863</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(22)00220-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC9045866</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chinnasamy</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Suresh</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ramprathap</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jebamani</surname>
              <given-names>BJA</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivas Rao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shiva Kranthi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccine sentiment analysis using public opinions on Twitter</article-title>
          <source>Mater Today Proc</source>
          <year>2022</year>
          <volume>64</volume>
          <fpage>448</fpage>
          <lpage>451</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35502322"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.matpr.2022.04.809</pub-id>
          <pub-id pub-id-type="medline">35502322</pub-id>
          <pub-id pub-id-type="pii">S2214-7853(22)02986-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC9046075</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Heymann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Szabo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Apas Vasandani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khubchandani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>DiLorenzo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Coffee</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Exploring coronavirus disease 2019 vaccine hesitancy on Twitter using sentiment analysis and natural language processing algorithms</article-title>
          <source>Clin Infect Dis</source>
          <year>2022</year>
          <month>05</month>
          <day>15</day>
          <volume>74</volume>
          <issue>Suppl_3</issue>
          <fpage>e4</fpage>
          <lpage>e9</lpage>
          <pub-id pub-id-type="doi">10.1093/cid/ciac141</pub-id>
          <pub-id pub-id-type="medline">35568473</pub-id>
          <pub-id pub-id-type="pii">6585957</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chandrasekaran</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Moustakas</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Examining public sentiments and attitudes toward COVID-19 vaccination: infoveillance study using Twitter posts</article-title>
          <source>JMIR Infodemiology</source>
          <year>2022</year>
          <month>4</month>
          <day>15</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>e33909</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35462735"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/33909</pub-id>
          <pub-id pub-id-type="medline">35462735</pub-id>
          <pub-id pub-id-type="pii">v2i1e33909</pub-id>
          <pub-id pub-id-type="pmcid">PMC9014796</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bensi</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Baecher</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Dynamic assessment of the COVID-19 vaccine acceptance leveraging social media data</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <month>05</month>
          <volume>129</volume>
          <fpage>104054</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35331966"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104054</pub-id>
          <pub-id pub-id-type="medline">35331966</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00070-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC8935963</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Public perception of SARS-CoV-2 vaccinations on social media: questionnaire and sentiment analysis</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2021</year>
          <month>12</month>
          <day>10</day>
          <volume>18</volume>
          <issue>24</issue>
          <fpage>13028</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph182413028"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph182413028</pub-id>
          <pub-id pub-id-type="medline">34948638</pub-id>
          <pub-id pub-id-type="pii">ijerph182413028</pub-id>
          <pub-id pub-id-type="pmcid">PMC8700913</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huangfu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccine tweets after vaccine rollout: sentiment-based topic modeling</article-title>
          <source>J Med Internet Res</source>
          <year>2022</year>
          <month>02</month>
          <day>08</day>
          <volume>24</volume>
          <issue>2</issue>
          <fpage>e31726</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2022/2/e31726/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/31726</pub-id>
          <pub-id pub-id-type="medline">34783665</pub-id>
          <pub-id pub-id-type="pii">v24i2e31726</pub-id>
          <pub-id pub-id-type="pmcid">PMC8827037</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karami</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goldschmidt</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Boyajieff</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Najafabadi</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 vaccine and social media in the U.S.: exploring emotions and discussions on Twitter</article-title>
          <source>Vaccines (Basel)</source>
          <year>2021</year>
          <month>09</month>
          <day>23</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>1059</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=vaccines9101059"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/vaccines9101059</pub-id>
          <pub-id pub-id-type="medline">34696167</pub-id>
          <pub-id pub-id-type="pii">vaccines9101059</pub-id>
          <pub-id pub-id-type="pmcid">PMC8540945</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liew</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <article-title>Examining the utility of social media in COVID-19 vaccination: unsupervised learning of 672,133 Twitter posts</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>11</month>
          <day>03</day>
          <volume>7</volume>
          <issue>11</issue>
          <fpage>e29789</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/11/e29789/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29789</pub-id>
          <pub-id pub-id-type="medline">34583316</pub-id>
          <pub-id pub-id-type="pii">v7i11e29789</pub-id>
          <pub-id pub-id-type="pmcid">PMC8568045</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yousefinaghani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mubareka</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Papadopoulos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sharif</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>An analysis of COVID-19 vaccine sentiments and opinions on Twitter</article-title>
          <source>Int J Infect Dis</source>
          <year>2021</year>
          <month>07</month>
          <volume>108</volume>
          <fpage>256</fpage>
          <lpage>262</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1201-9712(21)00462-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijid.2021.05.059</pub-id>
          <pub-id pub-id-type="medline">34052407</pub-id>
          <pub-id pub-id-type="pii">S1201-9712(21)00462-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8157498</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>They May Not Work! An evaluation of eleven sentiment analysis tools on seven social media datasets</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <month>08</month>
          <volume>132</volume>
          <fpage>104142</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104142</pub-id>
          <pub-id pub-id-type="medline">35835437</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00155-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kades</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sellner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koehler</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Full</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>TYE</given-names>
            </name>
            <name name-style="western">
              <surname>Kleesiek</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Maier-Hein</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>Adapting Bidirectional Encoder Representations from Transformers (BERT) to assess clinical semantic textual similarity: algorithm development and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>02</month>
          <day>03</day>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>e22795</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/2/e22795/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22795</pub-id>
          <pub-id pub-id-type="medline">33533728</pub-id>
          <pub-id pub-id-type="pii">v9i2e22795</pub-id>
          <pub-id pub-id-type="pmcid">PMC7889424</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Batsis</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Exploring deep transfer learning techniques for Alzheimer's dementia detection</article-title>
          <source>Front Comput Sci</source>
          <year>2021</year>
          <month>05</month>
          <day>12</day>
          <volume>3</volume>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34046588"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fcomp.2021.624683</pub-id>
          <pub-id pub-id-type="medline">34046588</pub-id>
          <pub-id pub-id-type="pii">624683</pub-id>
          <pub-id pub-id-type="pmcid">PMC8153512</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>BT</given-names>
            </name>
          </person-group>
          <article-title>Effects of data and entity ablation on multitask learning models for biomedical entity recognition</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <month>06</month>
          <volume>130</volume>
          <fpage>104062</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104062</pub-id>
          <pub-id pub-id-type="medline">35413440</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00078-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malla</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Alphonse</surname>
              <given-names>PJA</given-names>
            </name>
          </person-group>
          <article-title>Fake or real news about COVID-19? Pretrained transformer model to detect potential misleading news</article-title>
          <source>Eur Phys J Spec Top</source>
          <year>2022</year>
          <month>01</month>
          <day>13</day>
          <volume>231</volume>
          <issue>18-20</issue>
          <fpage>3347</fpage>
          <lpage>3356</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35039760"/>
          </comment>
          <pub-id pub-id-type="doi">10.1140/epjs/s11734-022-00436-6</pub-id>
          <pub-id pub-id-type="medline">35039760</pub-id>
          <pub-id pub-id-type="pii">436</pub-id>
          <pub-id pub-id-type="pmcid">PMC8756170</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>DQ</given-names>
            </name>
            <name name-style="western">
              <surname>Vu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>AT</given-names>
            </name>
          </person-group>
          <article-title>BERTweet: A pre-trained language model for English tweets</article-title>
          <source>Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations</source>
          <year>2020</year>
          <fpage>9</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.emnlp-demos.2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>1240</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31501885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
          <pub-id pub-id-type="pmcid">PMC7703786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rasmy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Med-BERT: pretrained contextualized embeddings on large-scale structured electronic health records for disease prediction</article-title>
          <source>NPJ Digit Med</source>
          <year>2021</year>
          <month>05</month>
          <day>20</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-021-00455-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="medline">34017034</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC8137882</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wawrzuta</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jaworski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gotlib</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Panczyk</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>What arguments against COVID-19 vaccines run on Facebook in Poland: content analysis of comments</article-title>
          <source>Vaccines (Basel)</source>
          <year>2021</year>
          <month>05</month>
          <day>10</day>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>481</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=vaccines9050481"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/vaccines9050481</pub-id>
          <pub-id pub-id-type="medline">34068500</pub-id>
          <pub-id pub-id-type="pii">vaccines9050481</pub-id>
          <pub-id pub-id-type="pmcid">PMC8150815</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kalichman</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Eaton</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Earnshaw</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Brousseau</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Faster than warp speed: early attention to COVD-19 by anti-vaccine groups on Facebook</article-title>
          <source>J Public Health (Oxf)</source>
          <year>2022</year>
          <month>03</month>
          <day>07</day>
          <volume>44</volume>
          <issue>1</issue>
          <fpage>e96</fpage>
          <lpage>e105</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33837428"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/pubmed/fdab093</pub-id>
          <pub-id pub-id-type="medline">33837428</pub-id>
          <pub-id pub-id-type="pii">6218921</pub-id>
          <pub-id pub-id-type="pmcid">PMC8083299</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Law</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Comparing public sentiment toward COVID-19 vaccines across Canadian cities: analysis of comments on Reddit</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>09</month>
          <day>24</day>
          <volume>23</volume>
          <issue>9</issue>
          <fpage>e32685</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/9/e32685/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/32685</pub-id>
          <pub-id pub-id-type="medline">34519654</pub-id>
          <pub-id pub-id-type="pii">v23i9e32685</pub-id>
          <pub-id pub-id-type="pmcid">PMC8477909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raoult</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Coronavirus: Towards a Way Out of the Crisis?</article-title>
          <source>Mediterranean Infection</source>
          <year>2020</year>
          <month>02</month>
          <day>25</day>
          <access-date>2021-08-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mediterranee-infection.com/coronavirus-vers-une-sortie-de-crise/">https://www.mediterranee-infection.com/coronavirus-vers-une-sortie-de-crise/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gautret</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lagier</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Parola</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hoang</surname>
              <given-names>VT</given-names>
            </name>
            <name name-style="western">
              <surname>Meddeb</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mailhe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Doudier</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Courjon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Giordanengo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vieira</surname>
              <given-names>VE</given-names>
            </name>
            <name name-style="western">
              <surname>Tissot Dupont</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Honoré</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Colson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chabrière</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>La Scola</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Rolain</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Brouqui</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Raoult</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Hydroxychloroquine and azithromycin as a treatment of COVID-19: results of an open-label non-randomized clinical trial</article-title>
          <source>Int J Antimicrob Agents</source>
          <year>2020</year>
          <month>07</month>
          <volume>56</volume>
          <issue>1</issue>
          <fpage>105949</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32205204"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijantimicag.2020.105949</pub-id>
          <pub-id pub-id-type="medline">32205204</pub-id>
          <pub-id pub-id-type="pii">S0924-8579(20)30099-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7102549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>López-Medina</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>López</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hurtado</surname>
              <given-names>IC</given-names>
            </name>
            <name name-style="western">
              <surname>Dávalos</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Díazgranados</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Oñate</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Chavarriaga</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Herrera</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Parra</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Libreros</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jaramillo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Avendaño</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Toro</surname>
              <given-names>DF</given-names>
            </name>
            <name name-style="western">
              <surname>Torres</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lesmes</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Rios</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Caicedo</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Effect of ivermectin on time to resolution of symptoms among adults with mild COVID-19: a randomized clinical trial</article-title>
          <source>JAMA</source>
          <year>2021</year>
          <month>04</month>
          <day>13</day>
          <volume>325</volume>
          <issue>14</issue>
          <fpage>1426</fpage>
          <lpage>1435</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33662102"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2021.3071</pub-id>
          <pub-id pub-id-type="medline">33662102</pub-id>
          <pub-id pub-id-type="pii">2777389</pub-id>
          <pub-id pub-id-type="pmcid">PMC7934083</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oldenburg</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Pinsky</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Brogdon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ruder</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nyatigo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Hinterwirth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lebas</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Redd</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Porco</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Lietman</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>BF</given-names>
            </name>
            <name name-style="western">
              <surname>Doan</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Effect of oral azithromycin vs placebo on COVID-19 symptoms in outpatients with SARS-CoV-2 infection: a randomized clinical trial</article-title>
          <source>JAMA</source>
          <year>2021</year>
          <month>08</month>
          <day>10</day>
          <volume>326</volume>
          <issue>6</issue>
          <fpage>490</fpage>
          <lpage>498</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34269813"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2021.11517</pub-id>
          <pub-id pub-id-type="medline">34269813</pub-id>
          <pub-id pub-id-type="pii">2782166</pub-id>
          <pub-id pub-id-type="pmcid">PMC8285753</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Leader</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yom-Tov</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Budenz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Klassen</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Applying multiple data collection tools to quantify human papillomavirus vaccine communication on Twitter</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <month>12</month>
          <day>05</day>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>e318</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/12/e318/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.6670</pub-id>
          <pub-id pub-id-type="medline">27919863</pub-id>
          <pub-id pub-id-type="pii">v18i12e318</pub-id>
          <pub-id pub-id-type="pmcid">PMC5168526</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="web">
          <article-title>thepanacealab / covid19_twitter</article-title>
          <source>GitHub</source>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/thepanacealab/covid19_twitter">https://github.com/thepanacealab/covid19_twitter</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="web">
          <article-title>ChristelDG / Covid_Vax_Tweet_Classif</article-title>
          <source>GitHub</source>
          <access-date>2023-02-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/ChristelDG/Covid_Vax_Tweet_Classif">https://github.com/ChristelDG/Covid_Vax_Tweet_Classif</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
