<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e66098</article-id>
      <article-id pub-id-type="pmid">40306628</article-id>
      <article-id pub-id-type="doi">10.2196/66098</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Use of Retrieval-Augmented Large Language Model for COVID-19 Fact-Checking: Development and Usability Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Coristine</surname>
            <given-names>Andrew</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hang</surname>
            <given-names>Ching Nam</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Nabeel</surname>
            <given-names>Ismail</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Hai</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution/>
            <institution>School of Economics and Management</institution>
            <institution>Shanghai University of Sport</institution>
            <addr-line>650 Hengren Road</addr-line>
            <addr-line>Yangpu District</addr-line>
            <addr-line>Shanghai, 200000</addr-line>
            <country>China</country>
            <phone>86 13816490872</phone>
            <email>lihai1107@hotmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2510-5103</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Jingyi</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4555-0797</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Ji</surname>
            <given-names>Mengmeng</given-names>
          </name>
          <degrees>MBBS, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1205-0369</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Yuyi</given-names>
          </name>
          <degrees>MB, MPH</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7625-810X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>An</surname>
            <given-names>Ruopeng</given-names>
          </name>
          <degrees>MPP, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9632-0209</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Economics and Management</institution>
        <institution>Shanghai University of Sport</institution>
        <addr-line>Shanghai</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Surgery</institution>
        <institution>Division of Public Health Sciences</institution>
        <institution>Washington University School of Medicine in St. Louis</institution>
        <addr-line>St. Louis, MO</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Division of Computational and Data Sciences</institution>
        <institution>Washington University in St. Louis</institution>
        <addr-line>St. Louis, MO</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Constance and Martin Silver Center on Data Science and Social Equity</institution>
        <institution>Silver School of Social Work</institution>
        <institution>New York University</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hai Li <email>lihai1107@hotmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>4</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e66098</elocation-id>
      <history>
        <date date-type="received">
          <day>3</day>
          <month>9</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>29</day>
          <month>11</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>12</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>28</day>
          <month>2</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Hai Li, Jingyi Huang, Mengmeng Ji, Yuyi Yang, Ruopeng An. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 30.04.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e66098" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The COVID-19 pandemic has been accompanied by an “infodemic,” where the rapid spread of misinformation has exacerbated public health challenges. Traditional fact-checking methods, though effective, are time-consuming and resource-intensive, limiting their ability to combat misinformation at scale. Large language models (LLMs) such as GPT-4 offer a more scalable solution, but their susceptibility to generating hallucinations—plausible yet incorrect information—compromises their reliability.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to enhance the accuracy and reliability of COVID-19 fact-checking by integrating a retrieval-augmented generation (RAG) system with LLMs, specifically addressing the limitations of hallucination and context inaccuracy inherent in stand-alone LLMs.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We constructed a context dataset comprising approximately 130,000 peer-reviewed papers related to COVID-19 from PubMed and Scopus. This dataset was integrated with GPT-4 to develop multiple RAG-enhanced models: the naïve RAG, Lord of the Retrievers (LOTR)–RAG, corrective RAG (CRAG), and self-RAG (SRAG). The RAG systems were designed to retrieve relevant external information, which was then embedded and indexed in a vector store for similarity searches. One real-world dataset and one synthesized dataset, each containing 500 claims, were used to evaluate the performance of these models. Each model’s accuracy, <italic>F</italic><sub>1</sub>-score, precision, and sensitivity were compared to assess their effectiveness in reducing hallucination and improving fact-checking accuracy.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The baseline GPT-4 model achieved an accuracy of 0.856 on the real-world dataset. The naïve RAG model improved this to 0.946, while the LOTR-RAG model further increased accuracy to 0.951. The CRAG and SRAG models outperformed all others, achieving accuracies of 0.972 and 0.973, respectively. The baseline GPT-4 model reached an accuracy of 0.960 on the synthesized dataset. The naïve RAG model increased this to 0.972, and the LOTR-RAG, CRAG, and SRAG models achieved an accuracy of 0.978. These findings demonstrate that the RAG-enhanced models consistently maintained high accuracy levels, closely mirroring ground-truth labels and significantly reducing hallucinations. The CRAG and SRAG models also provided more detailed and contextually accurate explanations, further establishing the superiority of agentic RAG frameworks in delivering reliable and precise fact-checking outputs across diverse datasets.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The integration of RAG systems with LLMs substantially improves the accuracy and contextual relevance of automated fact-checking. By reducing hallucinations and enhancing transparency by citing retrieved sources, this method holds significant promise for rapid, reliable information verification to combat misinformation during public health crises.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>large language model</kwd>
        <kwd>misinformation</kwd>
        <kwd>disinformation</kwd>
        <kwd>fact-checking</kwd>
        <kwd>COVID-19</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>ChatGPT</kwd>
        <kwd>natural language processing</kwd>
        <kwd>machine learning</kwd>
        <kwd>SARS-CoV-2</kwd>
        <kwd>coronavirus</kwd>
        <kwd>respiratory</kwd>
        <kwd>infectious</kwd>
        <kwd>pulmonary</kwd>
        <kwd>pandemic</kwd>
        <kwd>infodemic</kwd>
        <kwd>retrieval-augmented generation</kwd>
        <kwd>accuracy</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The COVID-19 pandemic has been accompanied by an “infodemic,” characterized by the rapid spread of misinformation and disinformation, significantly undermining public health efforts [<xref ref-type="bibr" rid="ref1">1</xref>]. Misinformation refers to the unintentional spread of incorrect or misleading information [<xref ref-type="bibr" rid="ref2">2</xref>], while disinformation involves deliberately disseminating false information to deceive [<xref ref-type="bibr" rid="ref3">3</xref>]. Both phenomena contribute to disseminating inaccurate health information during crises such as the COVID-19 pandemic, leading to high-risk behaviors and overwhelming public health systems [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>Fact-checking is crucial to combat health misinformation and disinformation. During the early stages of COVID-19, from January to March 2020, fact-checking related to COVID-19 increased by over 900% [<xref ref-type="bibr" rid="ref5">5</xref>]. This fact-checking primarily addressed topics such as illness, transmission and mortality rates, control measures, treatment options, and the causes of the disease [<xref ref-type="bibr" rid="ref6">6</xref>]. For example, rapid and widespread claims regarding substances such as lemon or bleach as cures for COVID-19 required prompt fact-checking to prevent adverse consequences.</p>
      <p>Conventional COVID-19 fact-checking methods have several notable drawbacks [<xref ref-type="bibr" rid="ref7">7</xref>]. Obtaining fact-checking directly from human experts or scientists can be time-consuming and challenging. The emergence of tools based on large language models (LLMs), such as OpenAI’s ChatGPT, has the potential to offer more efficient and convenient COVID-19 fact-checking than human checking. However, they also tend to generate plausible but incorrect or nonsensical information not grounded in the input data or real-world knowledge, commonly referred to as hallucinations [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Hallucinations can occur due to several reasons. First, LLMs may generate incorrect information because they rely heavily on the patterns and associations found in their training data, which can be subject to biases, inaccuracies, and gaps in the original data sources [<xref ref-type="bibr" rid="ref10">10</xref>]. Second, LLMs lack real-world understanding and contextual awareness, meaning they do not possess the ability to verify facts against actual events or comprehend nuanced contexts [<xref ref-type="bibr" rid="ref11">11</xref>]. In addition, the inherent probabilistic nature of LLMs can result in generating outputs that are statistically plausible but factually incorrect [<xref ref-type="bibr" rid="ref12">12</xref>]. Hallucinations significantly undermine the reliability of LLMs in identifying and correcting disinformation and misinformation, posing a severe challenge to their effectiveness in safeguarding public health information during the COVID-19 pandemic.</p>
      <p>Retrieval-augmented generation (RAG) is a state-of-the-art technique that enhances LLMs by integrating external data retrieval, improving factual accuracy, and reducing costs [<xref ref-type="bibr" rid="ref13">13</xref>]. By retrieving relevant information from external sources and incorporating it as contextual input, RAG effectively mitigates the issue of hallucinations in LLMs [<xref ref-type="bibr" rid="ref14">14</xref>]. This method also addresses the need for updated external knowledge without requiring costly training or fine-tuning, making it a practical solution for maintaining the reliability and relevance of LLMs in dynamic information environments [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      <p>This study aims to evaluate the effectiveness of the RAG system in enhancing the performance of LLMs for COVID-19 fact-checking. By integrating a contextual dataset of about 130,000 peer-reviewed papers on COVID-19 with GPT-4 as the base model, we assessed the performance of various RAG-equipped models. Our research contributions are as follows. First, we developed a novel RAG-equipped LLM method that significantly reduces both financial and time costs compared with conventional COVID-19 fact-checking approaches. Second, RAG-equipped LLMs enhance the reliability of COVID-19 fact-checking by providing specific explanations and references from peer-reviewed journals, effectively reducing hallucinations and external factual errors in LLMs. Finally, based on these promising results, this study could pave the way for developing a targeted web application for COVID-19 fact-checking designed to improve individuals’ understanding of accurate health information and support public health initiatives in combating misinformation.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data</title>
        <p>First, we constructed a context dataset for the RAG system by searching for “COVID-19” and “SARS-CoV-2” within the PubMed and Scopus databases. This dataset comprises 126,984 papers published in peer-reviewed journals between January 1, 2020, and January 1, 2024. About 31% (39,365/126,984) of the included papers were published in 2021 or 2022, and 22% (27,936/126,984) were published in 2023, which ensured that the dataset includes up-to-date and matured insights into COVID-19. Our RAG system leveraged this dataset as external knowledge to provide reliable and accurate COVID-19 fact-checking based on academic references.</p>
        <p>To evaluate the RAG system, we compiled two datasets of COVID-19–related claims (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The first dataset comprises 500 claims from social media posts and news outlets obtained via Kaggle (founded in 2010 by Anthony Goldbloom and Jeremy Howard and acquired by Google in 2017). The second dataset consists of 500 synthesized claims generated by GPT-4 using the context dataset of peer-reviewed academic papers. Both datasets were balanced, with 50% of the claims being true and 50% false. These datasets were used to assess model performance. <xref ref-type="table" rid="table1">Table 1</xref> provides examples of both true and false claims.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Examples of claims of COVID-19.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="900"/>
            <col width="0"/>
            <col width="70"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Type and example claims of COVID-19</td>
                <td>Label</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Real-world dataset</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Drinking methanol, ethanol, or bleach will not prevent or cure COVID-19 and can be very dangerous.</td>
                <td colspan="2">True</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Most people who contract COVID-19 will recover.</td>
                <td colspan="2">True</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Avocado and mint tea cure coronavirus.</td>
                <td colspan="2">False</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Chewing raw onions can prevent COVID-19.</td>
                <td colspan="2">False</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Synthesized dataset</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Antifibrotic therapies are being considered to manage progressive pulmonary fibrosis observed in some severe cases of COVID-19.</td>
                <td colspan="2">True</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Confusion or a sense of disorientation has been documented in patients with COVID-19, especially in older people.</td>
                <td colspan="2">True</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Smoking and long-term exposure to second-hand smoke are not associated with increased susceptibility to acute COVID-19 infection.</td>
                <td colspan="2">False</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>IL-6<sup>a</sup> receptor antagonists are ineffective in treating the cytokine release syndrome associated with COVID-19.</td>
                <td colspan="2">False</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>IL-6: Interleukin-6.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> illustrates the data preprocessing workflow for the RAG system. We extracted each academic paper’s abstract, title, authors, published journal, and publication date. Because academic abstracts are well structured, using the extracted information rather than the full-text papers allowed us to ensure accuracy while avoiding copyright issues and minimizing computational costs. The abstracts were segmented into smaller, overlapping chunks of appropriate length, which served as the primary input for further processing. The remaining details were treated as contextual metadata, which complements the abstract chunks during the retrieval process. Each segmented chunk was transformed into a numerical format known as a vector. These vectors are mathematical representations that enable computational operations. Vectors were stored in the vector store index within the Qdrant database, which was designed for similarity searches. The system used maximal marginal relevance technology to optimize the retrieval process by balancing relevance and diversity in the retrieved results.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Workflow of data preprocessing.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e66098_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Model Architecture</title>
        <sec>
          <title>Base Model</title>
          <p>We used OpenAI’s GPT-4 as the foundational model for the RAG system. In the corrective RAG (CRAG) and self-RAG (SRAG) workflow, GPT-4 additionally functions as a grader or rewriter model.</p>
        </sec>
        <sec>
          <title>Embedding Models</title>
          <p>We used two distinct embedding models in the RAG systems. The “text-embedding-ada-002” model provided by OpenAI was used across all RAG systems, and the “NeuML/pubmedbert-base-embeddings” model from Hugging Face was specifically applied in the LOTR-RAG system.</p>
        </sec>
        <sec>
          <title>Naïve RAG System</title>
          <p>The naïve RAG system combines the parametric memory of a pretrained LLM with the nonparametric memory of a vector index containing specific external knowledge [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
          <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows that the naïve RAG workflow begins with embedding the input query into a vector, followed by a similarity search within the vector store to retrieve the most relevant contexts. The LLM then conducts fact-checking on each COVID-19 claim based on these retrieved contexts, ensuring information retrieval accuracy and simultaneously providing reliable explanations and references.</p>
          <p>Despite its effectiveness, the naïve RAG has limitations, such as the “lost in the middle” phenomenon, where the LLM’s performance deteriorates when handling information located in the middle of lengthy contexts [<xref ref-type="bibr" rid="ref16">16</xref>]. To address this issue, we used the Lord of the Retrievers (LOTR)–RAG system [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Workflow of naïve retrieval-augmented generation. LLM: large language model.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e66098_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>LOTR-RAG System</title>
          <p>As <xref rid="figure3" ref-type="fig">Figure 3</xref> illustrates, the LOTR-RAG system enhances the relevance between context and query by using a merging retriever that integrates two distinct embedding models. This approach allows for creating two vector store indices, each associated with our context dataset, leading to more coherent and accurate responses than the naïve RAG system [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Workflow of Lord of the Retrievers–retrieval-augmented generation. LLM: large language model.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e66098_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>However, for more complex tasks such as fact-checking, the LOTR-RAG system may still be limited by integrating a single LLM and RAG system [<xref ref-type="bibr" rid="ref19">19</xref>]. To overcome these limitations, we introduced agentic frameworks—CRAG and SRAG—to further enhance the reliability of fact-checking.</p>
        </sec>
        <sec>
          <title>CRAG System</title>
          <p><xref rid="figure4" ref-type="fig">Figure 4</xref> illustrates the CRAG [<xref ref-type="bibr" rid="ref20">20</xref>] workflow. GPT-4 functions as a grader in this framework, evaluating the input, retrieval, and generation processes. The grader decides whether to retrieve information from the vector store or use the Tavily Search application programming interface, an LLM-optimized search engine developed by Tavily, which efficiently aggregates and ranks data from multiple sources for fast and consistent results [<xref ref-type="bibr" rid="ref21">21</xref>]. During the retrieval process, the grader assesses the relevance of the documents, and irrelevant documents are replaced with those obtained via web search. After answer generation, the grader verifies whether the answer is helpful for the fact-checking task and supported by the retrieved documents. If not, additional information is retrieved, or the answer is regenerated until it meets the criteria.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Workflow of corrective retrieval-augmented generation.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e66098_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>SRAG System</title>
          <p><xref rid="figure5" ref-type="fig">Figure 5</xref> illustrates the SRAG [<xref ref-type="bibr" rid="ref22">22</xref>] framework, which uses GPT-4 as both grader and rewriter. After retrieving documents, the grader assesses their relevance to the original query. If the documents are deemed irrelevant, the rewriter reformulates the query while preserving its original semantic meaning to enhance retrieval effectiveness. This iterative process continues until the retrieved documents demonstrate high relevance to the query, at which point an answer is generated. Following answer generation, the grader evaluates whether the response adequately addresses the input query and is supported by the retrieved documents. If the answer does not meet these criteria, the framework either rewrites the query or regenerates the answer, repeating the process until a satisfactory and reliable response is achieved.</p>
          <p>By integrating agentic frameworks such as CRAG and SRAG, the reliability of COVID-19 fact-checking is significantly enhanced, as the LLM’s outputs are rigorously evaluated before being presented to the user.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Workflow of self–retrieval-augmented generation.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e66098_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Prompt Engineering</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> outlines the prompts used in this study. For answer generation, the LLM is instructed to perform COVID-19 fact-checking based on retrieved documents from the context dataset, functioning as an expert. In the agentic frameworks of CRAG and SRAG, the LLM is further directed to evaluate the quality of retrieved documents and generated answers, ensuring the robustness of the entire workflow.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Prompts used in experiments.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="850"/>
            <thead>
              <tr valign="top">
                <td>Objective</td>
                <td>Prompt</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Generate answers</td>
                <td>You are an expert for the COVID-19 fact-checking tasks. Based on pieces of retrieved context to detect if the claim is true or false. You will have to give me the title and author of the context you referred to in one sentence. If you don’t know the answer, just say that you don’t know. Keep the answer concise.<break/>Claim: {question}<break/>Context: {context}<break/>Answer:</td>
              </tr>
              <tr valign="top">
                <td>Grade documents</td>
                <td>You are a grader assessing relevance of a retrieved document to a user question. If the document contains keywords related to the user question, grade it as relevant. It does not need to be a stringent test. The goal is to filter out erroneous retrievals. Give a binary score “yes” or “no” score to indicate whether the document is relevant to the question. Provide the binary score as a JSON with a single key “score” and no preamble or explanation.<break/>Here is the retrieved document: {document}<break/>Here is the user question: {question}</td>
              </tr>
              <tr valign="top">
                <td>Grade answers</td>
                <td>You are a grader assessing whether an answer is useful to resolve a question. Give a binary score “yes” or “no” to indicate whether the answer is useful to resolve a question. Provide the binary score as a JSON with a single key “score” and no preamble or explanation.<break/>Here is the answer: {generation}<break/>Here is the question: {question}</td>
              </tr>
              <tr valign="top">
                <td>Rewrite claims</td>
                <td>You are a claim rewriter that converts an input claim to a better version that is optimized for vector store retrieval and fact-checking. Look at the input and try to reason about the underlying semantic intent meaning.</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study used preexisting public data with no identifiable information, as the data were anonymized, and therefore does not require institutional review board review per Federal Regulations for the Protection of Human Research Subjects (45 CFR 46.104(d); [<xref ref-type="bibr" rid="ref23">23</xref>]).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p><xref ref-type="table" rid="table3">Table 3</xref> demonstrates the enhanced performance of our RAG-equipped GPT-4 models in COVID-19 fact-checking. The <italic>P</italic> value from the confusion matrix, used to evaluate if the model’s performance significantly differs from random guessing, was &#60;.001 for all cases (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). The integration of the RAG system notably improved the LLM’s performance on the real-world dataset. Specifically, the baseline GPT-4 model achieved an accuracy of 0.856, which increased to 0.946 with the implementation of the naïve RAG system. Further improvements were observed with the LOTR-RAG model reaching an accuracy of 0.951. The CRAG and SRAG models achieved even higher accuracies of 0.972 and 0.973, respectively. These results underscore the consistent and substantial accuracy gains achieved by each RAG-equipped model, bringing their performance nearly in line with the ground-truth labels.</p>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Results of COVID-19 fact-checking.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="370"/>
          <col width="150"/>
          <col width="150"/>
          <col width="150"/>
          <col width="150"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Target dataset and models</td>
              <td>Accuracy</td>
              <td><italic>F</italic><sub>1</sub>-score</td>
              <td>PPV<sup>a</sup></td>
              <td>Sensitivity</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="6">
                <bold>Real-world dataset</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>GPT-4</td>
              <td>0.856</td>
              <td>0.849</td>
              <td>0.894</td>
              <td>0.894</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Naïve RAG<sup>b</sup></td>
              <td>0.946</td>
              <td>0.945</td>
              <td>0.970</td>
              <td>0.920</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>LOTR-RAG<sup>c</sup></td>
              <td>0.951</td>
              <td>0.952</td>
              <td>0.959</td>
              <td>0.944</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>CRAG<sup>d</sup></td>
              <td>0.972</td>
              <td>0.972</td>
              <td>0.980</td>
              <td>0.965</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>SRAG<sup>e</sup></td>
              <td>0.973</td>
              <td>0.974</td>
              <td>0.968</td>
              <td>0.980</td>
            </tr>
            <tr valign="top">
              <td colspan="6">
                <bold>Synthesized dataset</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>GPT-4</td>
              <td>0.960</td>
              <td>0.961</td>
              <td>0.942</td>
              <td>0.980</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Naïve RAG</td>
              <td>0.972</td>
              <td>0.973</td>
              <td>0.947</td>
              <td>1.000</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>LOTR-RAG</td>
              <td>0.978</td>
              <td>0.978</td>
              <td>0.965</td>
              <td>0.992</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>CRAG</td>
              <td>0.978</td>
              <td>0.978</td>
              <td>0.972</td>
              <td>0.984</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>SRAG</td>
              <td>0.978</td>
              <td>0.978</td>
              <td>0.969</td>
              <td>0.988</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table3fn1">
            <p><sup>a</sup>PPV: positive predictive value.</p>
          </fn>
          <fn id="table3fn2">
            <p><sup>b</sup>RAG: retrieval-augmented generation.</p>
          </fn>
          <fn id="table3fn3">
            <p><sup>c</sup>LOTR-RAG: Lord of the Retrievers.</p>
          </fn>
          <fn id="table3fn4">
            <p><sup>d</sup>CRAG: corrective retrieval-augmented generation.</p>
          </fn>
          <fn id="table3fn5">
            <p><sup>e</sup>SRAG: self–retrieval-augmented generation.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>The RAG system similarly enhances the LLM’s performance on the synthesized dataset. The baseline GPT-4 model achieved an accuracy of 0.960, which improved to 0.972 with the naïve RAG system. The LOTR-RAG, CRAG, and SRAG models all attained an accuracy of 0.978. These results confirm that the RAG-equipped models consistently achieve high accuracy levels, closely mirroring the ground truth, and demonstrate the system’s robust performance across different datasets.</p>
      <p><xref ref-type="table" rid="table4">Table 4</xref> illustrates two examples of RAG systems in enhancing COVID-19 fact-checking accuracy. The baseline GPT-4 model struggled with identifying the facts behind COVID-19 claims, often producing hallucinations. Integrating naïve RAG significantly improved the model’s performance by providing more accurate and contextually relevant responses backed by an external context dataset (ie, academic papers). Further improvements were observed with the LOTR-RAG system, which offered even more precise explanations. The CRAG and SRAG models excelled, delivering the most detailed and specific responses among all models, demonstrating the advanced RAG systems’ superiority in generating accurate and reliable COVID-19 fact-checking outputs.</p>
      <table-wrap position="float" id="table4">
        <label>Table 4</label>
        <caption>
          <p>Examples of COVID-19 fact-checking.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="100"/>
          <col width="450"/>
          <col width="450"/>
          <thead>
            <tr valign="top">
              <td>Model</td>
              <td>Response to real claim: hydroxychloroquine not safe or effective for preventing or treating COVID-19 (true)</td>
              <td>Response to false claim: scientists confirmed COVID-19 was transmitted directly from pangolins to humans (false)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>GPT-4</td>
              <td>False</td>
              <td>False</td>
            </tr>
            <tr valign="top">
              <td>Naïve RAG<sup>a</sup></td>
              <td>True, several studies and clinical trials have investigated hydroxychloroquine's use for COVID-19, with varying results on its efficacy and safety.</td>
              <td>False. While pangolins were initially considered as potential intermediate hosts, it is generally accepted that SARS-CoV-2 has a probable bat origin, and the exact pathway to human transmission remains undetermined.</td>
            </tr>
            <tr valign="top">
              <td>CRAG<sup>b</sup></td>
              <td>Hydroxychloroquine is not effective in preventing or treating COVID-19, according to multiple studies. These include “Hydroxychloroquine or Chloroquine for Treatment or Prophylaxis of COVID-19: A Living Systematic Review” by A. V. Hernandez et al. 2020, and “A Randomized Trial of Hydroxychloroquine as Postexposure Prophylaxis for Covid-19” by D. R. Boulware et al. 2020. Despite its effectiveness in treating other conditions, it fails to prevent COVID-19 in exposed individuals or treat the disease.</td>
              <td>Based on the given context, the claim is true. The potential for another wave of COVID-19 infections is anticipated by various disease experts, due to new variants emerging. This is referenced in the documents “Predicting the development trend of the second wave of COVID-19 in five European countries” by J. Lei, M. Li, X. Wang and “The Impact of the COVID-19 Pandemic on Health-Care Delivery System for Other Diseases and Antimicrobial Resistance Threat in India” by D. Chakraborty, A. Majumdar, F. Debnath, S. Naskar, and S. Dutta. The specifics of the potential wave, including its scale and severity, are still uncertain.</td>
            </tr>
            <tr valign="top">
              <td>LOTR-RAG<sup>c</sup></td>
              <td>True. Based on the context provided, there is no scientific evidence to support the claim that hydroxychloroquine cures COVID-19 or is used for radiation sickness. The document titled “It is time to drop hydroxychloroquine from our COVID-19 armamentarium” by T. Kashour and I. M. Tleyjeh indicates that subsequent randomized trials revealed a lack of efficacy of hydroxychloroquine in improving the outcomes of COVID-19.</td>
              <td>False. No definitive evidence directly links pangolins as the intermediate host transmitting SARS-CoV-2 to humans. According to “COVID-19—Zoonosis or Emerging Infectious Disease?” by N. Haider et al., 2020, no cases of natural transmission from wild or domesticated animals have been confirmed as of their study, and SARS-CoV-2 does not meet the WHO definition of zoonoses.</td>
            </tr>
            <tr valign="top">
              <td>SRAG<sup>d</sup></td>
              <td>The claim that Hydroxychloroquine is not safe or effective for preventing or treating COVID-19 is TRUE. This is supported by a systematic review and meta-analysis conducted by Tanni et al (2021), which states that the use of Hydroxychloroquine increased the risk of adverse events and its use for prophylaxis of SARS-CoV-2 infection or treatment of mild COVID-19 is not recommended. Furthermore, M. Zepperi in 2023 warned of the drug's potential to cause retinal toxicity, leading to vision impairment or loss.</td>
              <td>The claim that COVID-19 was directly transmitted to humans from pangolins is not confirmed. The context from the document “Analysis of the hosts and transmission paths of SARS-CoV-2 in the COVID-19 outbreak” by R. Dong et al suggests a possible transmission path from bats to pangolins to humans, but does not confirm direct transmission to humans from pangolins. The genetic analysis indicates a close relationship, implying an intermediary host, but it does not establish direct transmission to humans.</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table4fn1">
            <p><sup>a</sup>RAG: retrieval-augmented generation.</p>
          </fn>
          <fn id="table4fn2">
            <p><sup>b</sup>CRAG: corrective retrieval-augmented generation.</p>
          </fn>
          <fn id="table4fn3">
            <p><sup>c</sup>LOTR-RAG: Lord of the Retrievers.</p>
          </fn>
          <fn id="table4fn4">
            <p><sup>d</sup>SRAG: self–retrieval-augmented generation.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>In addition, <xref ref-type="table" rid="table5">Table 5</xref> presents failure cases of our agentic RAG systems. While there are no instances of false fact-checking, some cases show the RAG system cannot find answers or retrieves mixed results. When relevant information cannot be retrieved, the system responds with “I don’t know” instead of fabricating answers. If mixed results are found, the system reports them accordingly. Therefore, CRAG and SRAG help users access relevant information and exercise caution with unclear claims, even if the full fact-checking process cannot be completed. We will discuss the limitations of the RAG-enhanced fact-checking system in the Discussion section.</p>
      <table-wrap position="float" id="table5">
        <label>Table 5</label>
        <caption>
          <p>Illustrative cases of fact-checking failures in an agentic RAG<sup>a</sup>.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="120"/>
          <col width="280"/>
          <col width="600"/>
          <thead>
            <tr valign="top">
              <td>RAG system</td>
              <td>Claim (ground truth)</td>
              <td>Response</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>CRAG<sup>b</sup></td>
              <td>Use of hydroxychloroquine alone as a treatment for COVID-19 is associated with a higher risk of death. (true)</td>
              <td>The claim is not unequivocally true or false since the studies show mixed results. S Arshad et al’s “Treatment with hydroxychloroquine, azithromycin, and combination in patients hospitalized with COVID-19” suggests that hydroxychloroquine alone might reduce COVID-19 mortality. Conversely, A H Elshafie et al in “Ivermectin role in COVID-19 treatment (IRICT): single-center, adaptive, randomized, double-blind, placebo-controlled, clinical trial” found that hydroxychloroquine increased the 3-month mortality rates. Finally, a third document indicates that its usage potentially increases the risk of death from COVID-19. Therefore, the claim is both supported and contradicted depending on the referred study.</td>
            </tr>
            <tr valign="top">
              <td>CRAG</td>
              <td>Homemade oxygen devices cannot help patients with COVID-19 at home. (false)</td>
              <td>The claim that homemade oxygen devices cannot help patients with COVID-19 at home is too broad, as the context does not provide information specifically about homemade oxygen devices. However, Dr Connolly confirms in a paper published by <italic>The Lancet Digital Health</italic> that pulse oximeters can be a helpful tool for self-monitoring oxygen levels in individuals with mild COVID-19 at home. Homemade oxygen devices were not discussed in the provided context, thus a definitive statement about their effectiveness cannot be made. Title: “Effectiveness and safety of pulse oximetry in remote patient monitoring of patients with COVID-19: a systematic review.” Author: <italic>The Lancet Digital Health</italic>, 2022.</td>
            </tr>
            <tr valign="top">
              <td>SRAG<sup>c</sup></td>
              <td>Nonabsorptive material has been shown to be better than absorptive material for personal protective clothing when combating coronaviruses other than SARS-CoV-2. (false)</td>
              <td>The claim is not mentioned in the provided context. The context from the document “Efficacy of cloth face mask in reducing COVID-19 transmission: A literature review” by Rizki and Kurniawan only discuss the efficacy of cloth face masks compared with surgical masks in the context of COVID-19, but does not compare nonabsorptive and absorptive materials.</td>
            </tr>
            <tr valign="top">
              <td>SRAG</td>
              <td>The biological ability of bats to detect cytoplasmic DNA in their bodies helps them respond to and coexist with viruses. (true)</td>
              <td>I don’t know. The provided context does not contain information related to the ability of bats to identify intracellular DNA or their efficiency in responding to viruses.</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table5fn1">
            <p><sup>a</sup>RAG: retrieval-augmented generation.</p>
          </fn>
          <fn id="table5fn2">
            <p><sup>b</sup>CRAG: corrective retrieval-augmented generation.</p>
          </fn>
          <fn id="table5fn3">
            <p><sup>c</sup>SRAG: self–retrieval-augmented generation.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study investigates the effectiveness of leveraging a RAG system to improve the accuracy and reliability of COVID-19 fact-checking using LLMs. Our method addresses two critical challenges: the inaccuracies and hallucinations often produced by LLMs and the high costs associated with traditional human-led fact-checking or fine-tuning methods. By integrating a vast dataset of approximately 130,000 peer-reviewed papers with GPT-4 and using an agentic RAG chain, we demonstrated significant improvements in both the accuracy and contextual relevance of the fact-checking process. Meanwhile, all of the RAG systems demonstrate cost efficiency, maintaining a low computational expense of less than US $0.08 per query in real-time applications.</p>
        <p>The spread of myths and disinformation during the COVID-19 pandemic has been a significant challenge, exacerbating public health crises by undermining trust in scientific expertise and promoting harmful behaviors [<xref ref-type="bibr" rid="ref24">24</xref>]. Traditional fact-checking methods, while effective, are often slow and resource-intensive, leading to delays in countering misinformation [<xref ref-type="bibr" rid="ref25">25</xref>]. Furthermore, the sheer volume of false information circulating on the internet makes it nearly impossible for human-led efforts to keep pace [<xref ref-type="bibr" rid="ref26">26</xref>]. Traditional approaches, such as using machine learning models to detect misinformation [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>] or fine-tuning LLMs to classify tweets into categories such as “entailment,” “neutral,” and “contradiction” [<xref ref-type="bibr" rid="ref29">29</xref>], have shown some promise. However, these methods often fall short when faced with the nuances of natural language and the complex reasoning required to debunk false claims [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <p>The integration of RAG systems with LLMs represents a transformative step forward in automated fact-checking. RAG-enhanced models address these limitations by combining the retrieval of relevant information from vast corpora with the ability to contextualize them, providing accurate and easy-to-understand explanations during critical events, such as the United States presidential election [<xref ref-type="bibr" rid="ref31">31</xref>]. Building on this progress, our RAG system adapts and extends these capabilities to meet the rigorous demands of health care and public health domains. These fields require exceptional factual accuracy and scientifically grounded explanations to ensure reliability and trust. By leveraging peer-reviewed papers as an external knowledge source, our system achieves state-of-the-art performance in health fact-checking. Furthermore, it offers a practical, cost-effective solution compared with resource-intensive alternatives, such as fine-tuned LLMs. This makes our approach both highly efficient and easily deployable for critical real-world applications.</p>
        <p>The implications of our findings are multifaceted. First, the ability of RAG-equipped models to deliver high-accuracy fact-checking in real time could transform how misinformation is managed during public health emergencies. In response to health communication policies aimed at combating health misinformation [<xref ref-type="bibr" rid="ref32">32</xref>], our RAG-enhanced LLMs can function as web applications or browser plugins deployed across various platforms, including social media and government websites, to provide timely and reliable information to the public. Furthermore, reducing the cost and time associated with fact-checking could enable wider adoption of these technologies, particularly in low-resource settings where misinformation can have devastating consequences. Our study highlights the potential for using advanced artificial intelligence (AI) systems to combat misinformation and improve public health literacy more broadly. The ability of our models to generate detailed, evidence-based explanations means that they could be used as educational tools, helping individuals to better understand complex health information and make informed decisions. This could be particularly valuable in addressing vaccine hesitancy and other public health challenges where misinformation plays a central role.</p>
        <p>Our findings highlight the potential of AI-driven technologies in combating misinformation during pandemics and other public health crises. The success of the RAG-equipped LLMs in enhancing the accuracy and efficiency of COVID-19 fact-checking suggests that similar approaches could be adapted and refined for broader applications, including emerging infectious diseases, cancer, cardiovascular health, and dietary behaviors [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Future research should explore the effectiveness of knowledge-graph RAG systems and the comparative performance of fine-tuned versus RAG-equipped LLMs in enhancing automated health fact-checking. The modularity and scalability of RAG systems present opportunities for developing flexible tools tailored to specific misinformation challenges, such as vaccine safety, treatment efficacy, or preventive measures [<xref ref-type="bibr" rid="ref35">35</xref>]. Integrating these systems into digital platforms, such as social media, news outlets, and public health websites, could provide real-time, accurate information directly to the public, countering misinformation before it gains traction [<xref ref-type="bibr" rid="ref36">36</xref>]. Collaboration between AI developers and public health experts, together with the integration of human feedback through a “human-in-the-loop” approach, will be crucial for ensuring the ethical implementation and effectiveness of those technologies, fostering more informed and resilient societies during public health crises [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Despite their advantages, RAG-based LLM systems have several limitations. The external knowledge dataset derived from peer-reviewed journal papers cannot capture the entirety of academic research on COVID-19 due to limitations such as language restrictions, geographical diversity, and the lack of timely clinical insights that remain unpublished. While RAG-enhanced models improve accuracy, they are not immune to errors and biases. The quality and diversity of the academic papers directly impact the outputs of fact-checking. Misinformation generally evolves faster than peer-reviewed literature, limiting the system’s responsiveness to emerging falsehoods, which can be a limitation for real-time applications. Furthermore, the opaque nature of RAG’s decision-making reduces interpretability. Finally, the system’s effectiveness in multilingual and low-resource settings remains limited, potentially exacerbating disparities in combating health misinformation. Addressing these challenges is essential for ensuring the reliability, scalability, and equitable application of RAG-LLM fact-checking in public health.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>This study demonstrates that the integration of RAG systems with LLMs substantially improves the accuracy and contextual relevance of automated fact-checking. By addressing the challenges of LLM inaccuracies and the high costs of traditional fact-checking methods, our RAG-enhanced approach improves the factual correctness of outputs. It provides contextually rich explanations that can be widely applied in combating misinformation during public health crises.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Claims for evaluation.</p>
        <media xlink:href="jmir_v27i1e66098_app1.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 64 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Detailed results of evaluation.</p>
        <media xlink:href="jmir_v27i1e66098_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 546 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CRAG</term>
          <def>
            <p>corrective retrieval-augmented generation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LOTR</term>
          <def>
            <p>Lord of the Retrievers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">RAG</term>
          <def>
            <p>retrieval-augmented generation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">SRAG</term>
          <def>
            <p>self–retrieval-augmented generation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>All relevant data and code used in this study are publicly available at GitHub [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>The conceptualization and methodology of the study were developed by RA and JH. Data curation was handled by JH, while formal analysis and validation were conducted by both JH and YY. Original draft was written by JH and YY. Supervision was provided by RA, MJ, and HL, and funding for the study was provided by HL.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>The Lancet Infectious Diseases</collab>
          </person-group>
          <article-title>The COVID-19 infodemic</article-title>
          <source>Lancet Infect Dis</source>
          <year>2020</year>
          <month>08</month>
          <volume>20</volume>
          <issue>8</issue>
          <fpage>875</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32687807"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1473-3099(20)30565-X</pub-id>
          <pub-id pub-id-type="medline">32687807</pub-id>
          <pub-id pub-id-type="pii">S1473-3099(20)30565-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7367666</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Borges do Nascimento</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Beatriz Pizarro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Azzopardi-Muscat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>André Gonçalves</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Björklund</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Novillo-Ortiz</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Infodemics and health misinformation: a systematic review of reviews</article-title>
          <source>Bull World Health Organ</source>
          <year>2022</year>
          <month>09</month>
          <day>01</day>
          <volume>100</volume>
          <issue>9</issue>
          <fpage>544</fpage>
          <lpage>561</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pmc.ncbi.nlm.nih.gov/articles/PMC9421549/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2471/blt.21.287654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bye</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bales</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gurdasani</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abba-Aji</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stuckler</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McKee</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Understanding and neutralising covid-19 misinformation and disinformation</article-title>
          <source>BMJ</source>
          <year>2022</year>
          <month>11</month>
          <day>22</day>
          <volume>379</volume>
          <fpage>e070331</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj-2022-070331</pub-id>
          <pub-id pub-id-type="medline">36414251</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilhelm</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ballalai</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Belanger</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Benjamin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bertrand-Ferrandis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bezbaruah</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Briand</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Brooks</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Bruns</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bucci</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Calleja</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chiou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Devaria</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dini</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>D'Souza</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>Adam G</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>Johannes C</given-names>
            </name>
            <name name-style="western">
              <surname>Evers</surname>
              <given-names>Silvia M A A</given-names>
            </name>
            <name name-style="western">
              <surname>Gobat</surname>
              <given-names>Nina</given-names>
            </name>
            <name name-style="western">
              <surname>Gissler</surname>
              <given-names>Mika</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzales</surname>
              <given-names>Ian Christian</given-names>
            </name>
            <name name-style="western">
              <surname>Gruzd</surname>
              <given-names>Anatoliy</given-names>
            </name>
            <name name-style="western">
              <surname>Hess</surname>
              <given-names>Sarah</given-names>
            </name>
            <name name-style="western">
              <surname>Ishizumi</surname>
              <given-names>Atsuyoshi</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>Oommen</given-names>
            </name>
            <name name-style="western">
              <surname>Joshi</surname>
              <given-names>Ashish</given-names>
            </name>
            <name name-style="western">
              <surname>Kaluza</surname>
              <given-names>Benjamin</given-names>
            </name>
            <name name-style="western">
              <surname>Khamis</surname>
              <given-names>Nagwa</given-names>
            </name>
            <name name-style="western">
              <surname>Kosinska</surname>
              <given-names>Monika</given-names>
            </name>
            <name name-style="western">
              <surname>Kulkarni</surname>
              <given-names>Shibani</given-names>
            </name>
            <name name-style="western">
              <surname>Lingri</surname>
              <given-names>Dimitra</given-names>
            </name>
            <name name-style="western">
              <surname>Ludolph</surname>
              <given-names>Ramona</given-names>
            </name>
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>Tim</given-names>
            </name>
            <name name-style="western">
              <surname>Mandić-Rajčević</surname>
              <given-names>Stefan</given-names>
            </name>
            <name name-style="western">
              <surname>Menczer</surname>
              <given-names>Filippo</given-names>
            </name>
            <name name-style="western">
              <surname>Mudaliar</surname>
              <given-names>Vijaybabu</given-names>
            </name>
            <name name-style="western">
              <surname>Murthy</surname>
              <given-names>Shruti</given-names>
            </name>
            <name name-style="western">
              <surname>Nazakat</surname>
              <given-names>Syed</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>Tim</given-names>
            </name>
            <name name-style="western">
              <surname>Nilsen</surname>
              <given-names>Jennifer</given-names>
            </name>
            <name name-style="western">
              <surname>Pallari</surname>
              <given-names>Elena</given-names>
            </name>
            <name name-style="western">
              <surname>Pasternak Taschner</surname>
              <given-names>Natalia</given-names>
            </name>
            <name name-style="western">
              <surname>Petelos</surname>
              <given-names>Elena</given-names>
            </name>
            <name name-style="western">
              <surname>Prinstein</surname>
              <given-names>Mitchell J</given-names>
            </name>
            <name name-style="western">
              <surname>Roozenbeek</surname>
              <given-names>Jon</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>Anton</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>Varadharajan</given-names>
            </name>
            <name name-style="western">
              <surname>Stevanović</surname>
              <given-names>Aleksandar</given-names>
            </name>
            <name name-style="western">
              <surname>Strahwald</surname>
              <given-names>Brigitte</given-names>
            </name>
            <name name-style="western">
              <surname>Syed Abdul</surname>
              <given-names>Shabbir</given-names>
            </name>
            <name name-style="western">
              <surname>Varaidzo Machiri</surname>
              <given-names>Sandra</given-names>
            </name>
            <name name-style="western">
              <surname>van der Linden</surname>
              <given-names>Sander</given-names>
            </name>
            <name name-style="western">
              <surname>Voegeli</surname>
              <given-names>Christopher</given-names>
            </name>
            <name name-style="western">
              <surname>Wardle</surname>
              <given-names>Claire</given-names>
            </name>
            <name name-style="western">
              <surname>Wegwarth</surname>
              <given-names>Odette</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>Becky K</given-names>
            </name>
            <name name-style="western">
              <surname>Willie</surname>
              <given-names>Estelle</given-names>
            </name>
            <name name-style="western">
              <surname>Yau</surname>
              <given-names>Brian</given-names>
            </name>
            <name name-style="western">
              <surname>Purnat</surname>
              <given-names>Tina D</given-names>
            </name>
          </person-group>
          <article-title>Measuring the burden of infodemics: summary of the methods and results of the Fifth WHO Infodemic Management Conference</article-title>
          <source>JMIR Infodemiology</source>
          <year>2023</year>
          <volume>3</volume>
          <fpage>e44207</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2023/1/e44207/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/44207</pub-id>
          <pub-id pub-id-type="medline">37012998</pub-id>
          <pub-id pub-id-type="pii">v3i1e44207</pub-id>
          <pub-id pub-id-type="pmcid">PMC9989916</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Harwood</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chillrud</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ananthram</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Subbiah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McKeown</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Check-COVID: fact-checking COVID-19 news claims with scientific evidence</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on May 29, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2305.18265"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2023.findings-acl.888</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>EWJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>YT</given-names>
            </name>
          </person-group>
          <article-title>From pandemic to plandemic: examining the amplification and attenuation of COVID-19 misinformation on social media</article-title>
          <source>Soc Sci Med</source>
          <year>2023</year>
          <month>07</month>
          <volume>328</volume>
          <fpage>115979</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37245261"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.socscimed.2023.115979</pub-id>
          <pub-id pub-id-type="medline">37245261</pub-id>
          <pub-id pub-id-type="pii">S0277-9536(23)00336-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10200718</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kolluri</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Murthy</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 misinformation detection: machine-learned solutions to the infodemic</article-title>
          <source>JMIR Infodemiology</source>
          <year>2022</year>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e38756</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2022/2/e38756/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/38756</pub-id>
          <pub-id pub-id-type="medline">37113446</pub-id>
          <pub-id pub-id-type="pii">v2i2e38756</pub-id>
          <pub-id pub-id-type="pmcid">PMC9987189</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Augenstein</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Baldwin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ciampaglia</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Corney</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>DiResta</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrara</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hale</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Halevy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hovy</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Menczer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Miguez</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nakov</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Scheufele</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zagni</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Factuality challenges in the era of large language models and opportunities for fact-checking</article-title>
          <source>Nat Mach Intell</source>
          <year>2024</year>
          <month>08</month>
          <day>22</day>
          <volume>6</volume>
          <issue>8</issue>
          <fpage>852</fpage>
          <lpage>863</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s42256-024-00881-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s42256-024-00881-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Frieske</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ishii</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bang</surname>
              <given-names>YJ</given-names>
            </name>
            <name name-style="western">
              <surname>Madotto</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fung</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Survey of hallucination in natural language generation</article-title>
          <source>ACM Comput Surv</source>
          <year>2023</year>
          <month>03</month>
          <day>03</day>
          <volume>55</volume>
          <issue>12</issue>
          <fpage>1</fpage>
          <lpage>38</lpage>
          <pub-id pub-id-type="doi">10.1145/3571730</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ullah</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Parwani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Baig</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Challenges and barriers of using large language models (LLM) such as ChatGPT for diagnostic medicine with a focus on digital pathology - a recent scoping review</article-title>
          <source>Diagn Pathol</source>
          <year>2024</year>
          <month>02</month>
          <day>27</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>43</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://diagnosticpathology.biomedcentral.com/articles/10.1186/s13000-024-01464-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13000-024-01464-7</pub-id>
          <pub-id pub-id-type="medline">38414074</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13000-024-01464-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC10898121</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Moniz</surname>
              <given-names>JRA</given-names>
            </name>
            <name name-style="western">
              <surname>Bhargava</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Piraviperumal</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>BH</given-names>
            </name>
          </person-group>
          <article-title>Can large language models understand context?</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on February 1, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2402.00858"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2402.00858</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>QV</given-names>
            </name>
          </person-group>
          <article-title>Long-form factuality in large language models</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on March 27, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2403.18802"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2403.18802</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Perez</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Piktus</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Petroni</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Karpukhin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Küttler</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yih</surname>
              <given-names>WT</given-names>
            </name>
            <name name-style="western">
              <surname>Rocktäschel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Riedel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kiela</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Retrieval-augmented generation for knowledge-intensive NLP tasks</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on May 22, 2020</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2005.11401"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2005.11401</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Retrieval-augmented generation for large language models: a survey</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on December 18, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2312.10997"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2312.10997</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>FoRAG: Factuality-optimized Retrieval Augmented Generation for web-enhanced long-form question answering</article-title>
          <year>2024</year>
          <conf-name>Proceedings of the 30th ACM SIGKDD Conference on Knowledge Discovery and Data Mining (KDD '24)</conf-name>
          <conf-date>August 25-29, 2024</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3637528.3672065</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>NF</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hewitt</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Paranjape</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bevilacqua</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Petroni</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Lost in the middle: how language models use long contexts</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on July 6, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2307.03172"/>
          </comment>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00638</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <article-title>LOTR (Merger Retriever)</article-title>
          <source>LangChain</source>
          <year>2024</year>
          <access-date>2024-08-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://python.langchain.com/v0.2/docs/integrations/retrievers/merger_retriever/">https://python.langchain.com/v0.2/docs/integrations/retrievers/merger_retriever/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>Better RAG with LOTR-Lord of Retriever</article-title>
          <source>Medium</source>
          <access-date>2024-08-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medium.com/etoai/better-rag-with-lotr-lord-of-retriever-23c8336b9a35">https://medium.com/etoai/better-rag-with-lotr-lord-of-retriever-23c8336b9a35</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>An</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Golden-retriever: high-fidelity agentic retrieval augmented generation for industrial knowledge base</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on July 20, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2408.00798"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2408.00798</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>SQ</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>ZH</given-names>
            </name>
          </person-group>
          <article-title>Corrective retrieval augmented generation</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on January 29, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2401.15884"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2401.15884</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <article-title>FAQ</article-title>
          <source>Tavily</source>
          <access-date>2024-12-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://docs.tavily.com/faq/faq">https://docs.tavily.com/faq/faq</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Asai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sil</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hajishirzi</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Self-RAG: learning to retrieve, generate, and critique through self-reflection</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on October 17, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2310.11511"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2310.11511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <article-title>Office for Human Research Protections: 45 CFR 46</article-title>
          <source>U.S. Department of Health and Human Services</source>
          <year>2025</year>
          <month>02</month>
          <day>11</day>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hhs.gov/ohrp/regulations-and-policy/regulations/45-cfr-46/index.html">https://www.hhs.gov/ohrp/regulations-and-policy/regulations/45-cfr-46/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferreira Caceres</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Sosa</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Lawrence</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Sestacovschi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tidd-Johnson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rasool</surname>
              <given-names>MHU</given-names>
            </name>
            <name name-style="western">
              <surname>Gadamidi</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Ozair</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pandav</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cuevas-Lou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Parrish</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>The impact of misinformation on the COVID-19 pandemic</article-title>
          <source>AIMS Public Health</source>
          <year>2022</year>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>262</fpage>
          <lpage>277</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35634019"/>
          </comment>
          <pub-id pub-id-type="doi">10.3934/publichealth.2022018</pub-id>
          <pub-id pub-id-type="medline">35634019</pub-id>
          <pub-id pub-id-type="pii">publichealth-09-02-018</pub-id>
          <pub-id pub-id-type="pmcid">PMC9114791</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Di Sotto</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Viviani</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Health misinformation detection in the social web: an overview and a data science approach</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2022</year>
          <month>02</month>
          <day>15</day>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>2173</fpage>
          <lpage>2193</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph19042173"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph19042173</pub-id>
          <pub-id pub-id-type="medline">35206359</pub-id>
          <pub-id pub-id-type="pii">ijerph19042173</pub-id>
          <pub-id pub-id-type="pmcid">PMC8872515</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bateman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Countering disinformation effectively: an evidence-based policy guide</article-title>
          <source>Carnegie Endowment for International Peace</source>
          <year>2024</year>
          <access-date>2024-08-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://carnegieendowment.org/research/2024/01/countering-disinformation-effectively-an-evidence-based-policy-guide?lang=en">https://carnegieendowment.org/research/2024/01/countering-disinformation-effectively-an-evidence-based-policy-guide?lang=en</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dixit</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Bhagat</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dangi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Automating fake news detection using PPCA and levy flight-based LSTM</article-title>
          <source>Soft Comput</source>
          <year>2022</year>
          <volume>26</volume>
          <issue>22</issue>
          <fpage>12545</fpage>
          <lpage>12557</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35729952"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00500-022-07215-4</pub-id>
          <pub-id pub-id-type="medline">35729952</pub-id>
          <pub-id pub-id-type="pii">7215</pub-id>
          <pub-id pub-id-type="pmcid">PMC9202495</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaliyar</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Goswami</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Narang</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>EchoFakeD: improving fake news detection in social media with an efficient deep neural network</article-title>
          <source>Neural Comput Appl</source>
          <year>2021</year>
          <volume>33</volume>
          <issue>14</issue>
          <fpage>8597</fpage>
          <lpage>8613</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33424132"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00521-020-05611-1</pub-id>
          <pub-id pub-id-type="medline">33424132</pub-id>
          <pub-id pub-id-type="pii">5611</pub-id>
          <pub-id pub-id-type="pmcid">PMC7776294</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrara</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>FACT-GPT: fact-checking augmentation via claim matching with LLMs</article-title>
          <year>2024</year>
          <conf-name>Proceedings of the WWW '24: Companion Proceedings of the ACM Web Conference 2024</conf-name>
          <conf-date>May 13-17, 2024</conf-date>
          <conf-loc>New York, NY</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3589335.3651504</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alghamdi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive survey on machine learning approaches for fake news detection</article-title>
          <source>Multimed Tools Appl</source>
          <year>2023</year>
          <month>11</month>
          <day>09</day>
          <volume>83</volume>
          <issue>17</issue>
          <fpage>51009</fpage>
          <lpage>51067</lpage>
          <pub-id pub-id-type="doi">10.1007/s11042-023-17470-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hang</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>CW</given-names>
            </name>
          </person-group>
          <article-title>TrumorGPT: query optimization and semantic reasoning over networks for automated fact-checking</article-title>
          <year>2024</year>
          <conf-name>Proceedings of the 58th Annual Conference on Information Sciences and Systems (CISS)</conf-name>
          <conf-date>March 15, 2024</conf-date>
          <conf-loc>Princeton, NJ</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ciss59072.2024.10480162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>WHO Strategic Communications Framework for effective communications</article-title>
          <source>World Health Organization</source>
          <year>2017</year>
          <access-date>2024-12-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/docs/default-source/documents/communicating-for-health/communication-framework.pdf">https://www.who.int/docs/default-source/documents/communicating-for-health/communication-framework.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chiou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Voegeli</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wilhelm</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kolis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brookmeyer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Prybylski</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The future of infodemic surveillance as public health surveillance</article-title>
          <source>Emerg Infect Dis</source>
          <year>2022</year>
          <month>12</month>
          <volume>28</volume>
          <issue>13</issue>
          <fpage>S121</fpage>
          <lpage>S128</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3201/eid2813.220696"/>
          </comment>
          <pub-id pub-id-type="doi">10.3201/eid2813.220696</pub-id>
          <pub-id pub-id-type="medline">36502389</pub-id>
          <pub-id pub-id-type="pmcid">PMC9745233</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khaliq</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pflugfelder</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Miletić</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>RAGAR, your falsehood radar: RAG-augmented reasoning for political fact-checking using multimodal large language models</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on April 18, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2404.12065"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2024.fever-1.29</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Calleja</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>AbdAllah</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Albarracin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Altieri</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Anoko</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Arcos</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Azlan</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Bayer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bechmann</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bezbaruah</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Briand</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Brooks</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Bucci</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Burzo</surname>
              <given-names>Stefano</given-names>
            </name>
            <name name-style="western">
              <surname>Czerniak</surname>
              <given-names>Christine</given-names>
            </name>
            <name name-style="western">
              <surname>De Domenico</surname>
              <given-names>Manlio</given-names>
            </name>
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>Adam G</given-names>
            </name>
            <name name-style="western">
              <surname>Ecker</surname>
              <given-names>Ullrich K H</given-names>
            </name>
            <name name-style="western">
              <surname>Espinosa</surname>
              <given-names>Laura</given-names>
            </name>
            <name name-style="western">
              <surname>Francois</surname>
              <given-names>Camille</given-names>
            </name>
            <name name-style="western">
              <surname>Gradon</surname>
              <given-names>Kacper</given-names>
            </name>
            <name name-style="western">
              <surname>Gruzd</surname>
              <given-names>Anatoliy</given-names>
            </name>
            <name name-style="western">
              <surname>Gülgün</surname>
              <given-names>Beste Sultan</given-names>
            </name>
            <name name-style="western">
              <surname>Haydarov</surname>
              <given-names>Rustam</given-names>
            </name>
            <name name-style="western">
              <surname>Hurley</surname>
              <given-names>Cherstyn</given-names>
            </name>
            <name name-style="western">
              <surname>Astuti</surname>
              <given-names>Santi Indra</given-names>
            </name>
            <name name-style="western">
              <surname>Ishizumi</surname>
              <given-names>Atsuyoshi</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>Neil</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson Restrepo</surname>
              <given-names>Dylan</given-names>
            </name>
            <name name-style="western">
              <surname>Kajimoto</surname>
              <given-names>Masato</given-names>
            </name>
            <name name-style="western">
              <surname>Koyuncu</surname>
              <given-names>Aybüke</given-names>
            </name>
            <name name-style="western">
              <surname>Kulkarni</surname>
              <given-names>Shibani</given-names>
            </name>
            <name name-style="western">
              <surname>Lamichhane</surname>
              <given-names>Jaya</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>Rosamund</given-names>
            </name>
            <name name-style="western">
              <surname>Mahajan</surname>
              <given-names>Avichal</given-names>
            </name>
            <name name-style="western">
              <surname>Mandil</surname>
              <given-names>Ahmed</given-names>
            </name>
            <name name-style="western">
              <surname>McAweeney</surname>
              <given-names>Erin</given-names>
            </name>
            <name name-style="western">
              <surname>Messer</surname>
              <given-names>Melanie</given-names>
            </name>
            <name name-style="western">
              <surname>Moy</surname>
              <given-names>Wesley</given-names>
            </name>
            <name name-style="western">
              <surname>Ndumbi Ngamala</surname>
              <given-names>Patricia</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>Tim</given-names>
            </name>
            <name name-style="western">
              <surname>Nunn</surname>
              <given-names>Mark</given-names>
            </name>
            <name name-style="western">
              <surname>Omer</surname>
              <given-names>Saad B</given-names>
            </name>
            <name name-style="western">
              <surname>Pagliari</surname>
              <given-names>Claudia</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>Palak</given-names>
            </name>
            <name name-style="western">
              <surname>Phuong</surname>
              <given-names>Lynette</given-names>
            </name>
            <name name-style="western">
              <surname>Prybylski</surname>
              <given-names>Dimitri</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidian</surname>
              <given-names>Arash</given-names>
            </name>
            <name name-style="western">
              <surname>Rempel</surname>
              <given-names>Emily</given-names>
            </name>
            <name name-style="western">
              <surname>Rubinelli</surname>
              <given-names>Sara</given-names>
            </name>
            <name name-style="western">
              <surname>Sacco</surname>
              <given-names>PierLuigi</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>Anton</given-names>
            </name>
            <name name-style="western">
              <surname>Shu</surname>
              <given-names>Kai</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>Melanie</given-names>
            </name>
            <name name-style="western">
              <surname>Sufehmi</surname>
              <given-names>Harry</given-names>
            </name>
            <name name-style="western">
              <surname>Tangcharoensathien</surname>
              <given-names>Viroj</given-names>
            </name>
            <name name-style="western">
              <surname>Terry</surname>
              <given-names>Robert</given-names>
            </name>
            <name name-style="western">
              <surname>Thacker</surname>
              <given-names>Naveen</given-names>
            </name>
            <name name-style="western">
              <surname>Trewinnard</surname>
              <given-names>Tom</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>Shannon</given-names>
            </name>
            <name name-style="western">
              <surname>Tworek</surname>
              <given-names>Heidi</given-names>
            </name>
            <name name-style="western">
              <surname>Uakkas</surname>
              <given-names>Saad</given-names>
            </name>
            <name name-style="western">
              <surname>Vraga</surname>
              <given-names>Emily</given-names>
            </name>
            <name name-style="western">
              <surname>Wardle</surname>
              <given-names>Claire</given-names>
            </name>
            <name name-style="western">
              <surname>Wasserman</surname>
              <given-names>Herman</given-names>
            </name>
            <name name-style="western">
              <surname>Wilhelm</surname>
              <given-names>Elisabeth</given-names>
            </name>
            <name name-style="western">
              <surname>Würz</surname>
              <given-names>Andrea</given-names>
            </name>
            <name name-style="western">
              <surname>Yau</surname>
              <given-names>Brian</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Lei</given-names>
            </name>
            <name name-style="western">
              <surname>Purnat</surname>
              <given-names>Tina D</given-names>
            </name>
          </person-group>
          <article-title>A public health research agenda for managing infodemics: methods and results of the First WHO Infodemiology Conference</article-title>
          <source>JMIR Infodemiology</source>
          <year>2021</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>e30979</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2021/1/e30979/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30979</pub-id>
          <pub-id pub-id-type="medline">34604708</pub-id>
          <pub-id pub-id-type="pii">v1i1e30979</pub-id>
          <pub-id pub-id-type="pmcid">PMC8448461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A survey on retrieval-augmented text generation for large language models</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on April 17, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2404.10981"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2404.10981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rosella</surname>
              <given-names>LC</given-names>
            </name>
          </person-group>
          <article-title>Priorities for successful use of artificial intelligence by public health organizations: a literature review</article-title>
          <source>BMC Public Health</source>
          <year>2022</year>
          <month>11</month>
          <day>22</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>2146</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-022-14422-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-022-14422-z</pub-id>
          <pub-id pub-id-type="medline">36419010</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-022-14422-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC9682716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
          <article-title>Jingyi-H-SH / Use-of-Retrieval-Augmented-Large-Language-Model-for-COVID-19-Fact-Checking-</article-title>
          <source>GitHub</source>
          <access-date>2025-04-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/Jingyi-H-SH/Use-of-Retrieval-Augmented-Large-Language-Model-for-COVID-19-Fact-Checking-">https://github.com/Jingyi-H-SH/Use-of-Retrieval-Augmented-Large-Language-Model-for-COVID-19-Fact-Checking-</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
