<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e60601</article-id>
      <article-id pub-id-type="pmid">39361955</article-id>
      <article-id pub-id-type="doi">10.2196/60601</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Ascle—A Python Natural Language Processing Toolkit for Medical Text Generation: Development and Evaluation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wu</surname>
            <given-names>Chaoyi</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hanne</surname>
            <given-names>Thomas</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Rui</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-0597-7197</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>Qingcheng</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8697-2729</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>You</surname>
            <given-names>Keen</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-9534-3041</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Qiao</surname>
            <given-names>Yujie</given-names>
          </name>
          <degrees>MPH</degrees>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-7182-2355</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Lucas</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-9600-9335</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Hsieh</surname>
            <given-names>Chia-Chun</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-4074-8659</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Rosand</surname>
            <given-names>Benjamin</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8140-9438</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Goldwasser</surname>
            <given-names>Jeremy</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-4263-2108</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Dave</surname>
            <given-names>Amisha</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff05" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8377-8309</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Keenan</surname>
            <given-names>Tiarnan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff06" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2253-1772</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Ke</surname>
            <given-names>Yuhe</given-names>
          </name>
          <degrees>MBBS</degrees>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7193-4749</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Hong</surname>
            <given-names>Chuan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff08" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7056-9559</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Nan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff09" ref-type="aff">9</xref>
          <xref rid="aff10" ref-type="aff">10</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3610-4883</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author">
          <name name-style="western">
            <surname>Chew</surname>
            <given-names>Emily</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff06" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0999-9802</ext-link>
        </contrib>
        <contrib id="contrib15" contrib-type="author" deceased="yes">
          <name name-style="western">
            <surname>Radev</surname>
            <given-names>Dragomir</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7830-6489</ext-link>
        </contrib>
        <contrib id="contrib16" contrib-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Zhiyong</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff11" ref-type="aff">11</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9998-916X</ext-link>
        </contrib>
        <contrib id="contrib17" contrib-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Hua</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff12" ref-type="aff">12</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5274-4672</ext-link>
        </contrib>
        <contrib id="contrib18" contrib-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Qingyu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff12" ref-type="aff">12</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6036-1516</ext-link>
        </contrib>
        <contrib id="contrib19" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Irene</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff13" ref-type="aff">13</xref>
          <address>
            <institution>Information Technology Center</institution>
            <institution>University of Tokyo</institution>
            <addr-line>6-2-3 Kashiwanoha</addr-line>
            <addr-line>Kashiwa, 277-8582</addr-line>
            <country>Japan</country>
            <phone>81 09014707813</phone>
            <email>ireneli@ds.itc.u-tokyo.ac.jp</email>
          </address>
          <xref rid="aff14" ref-type="aff">14</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1851-5390</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff01">
        <label>1</label>
        <institution>Centre for Quantitative Medicine</institution>
        <institution>Duke-NUS Medical School</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff02">
        <label>2</label>
        <institution>Department of Linguistics</institution>
        <institution>Northwestern University</institution>
        <addr-line>Evanston, IL</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff03">
        <label>3</label>
        <institution>Department of Computer Science</institution>
        <institution>Yale University</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff04">
        <label>4</label>
        <institution>Yale School of Public Health</institution>
        <institution>Yale University</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff05">
        <label>5</label>
        <institution>Yale New Haven Hospital</institution>
        <institution>Yale School of Medicine</institution>
        <institution>Yale University</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff06">
        <label>6</label>
        <institution>Division of Epidemiology and Clinical Applications</institution>
        <institution>National Eye Institute, National Institutes of Health</institution>
        <addr-line>Bethesda, MD</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff07">
        <label>7</label>
        <institution>Department of Anesthesiology</institution>
        <institution>Singapore General Hospital</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff08">
        <label>8</label>
        <institution>Department of Biostatistics and Bioinformatics</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff09">
        <label>9</label>
        <institution>Program in Health Services and Systems Research</institution>
        <institution>Duke-NUS Medical School</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff10">
        <label>10</label>
        <institution>Institute of Data Science</institution>
        <institution>National University of Singapore</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff11">
        <label>11</label>
        <institution>National Center for Biotechnology Information, National Library of Medicine</institution>
        <institution>National Institutes of Health</institution>
        <addr-line>Bethesda, MD</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff12">
        <label>12</label>
        <institution>Department of Biomedical Informatics and Data Science</institution>
        <institution>Yale School of Medicine</institution>
        <institution>Yale University</institution>
        <addr-line>New Haven, CT</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff13">
        <label>13</label>
        <institution>Information Technology Center</institution>
        <institution>University of Tokyo</institution>
        <addr-line>Kashiwa</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff14">
        <label>14</label>
        <institution>Smartor LLC</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Irene Li <email>ireneli@ds.itc.u-tokyo.ac.jp</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>3</day>
        <month>10</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e60601</elocation-id>
      <history>
        <date date-type="received">
          <day>16</day>
          <month>5</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>13</day>
          <month>6</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>8</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>15</day>
          <month>7</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Rui Yang, Qingcheng Zeng, Keen You, Yujie Qiao, Lucas Huang, Chia-Chun Hsieh, Benjamin Rosand, Jeremy Goldwasser, Amisha Dave, Tiarnan Keenan, Yuhe Ke, Chuan Hong, Nan Liu, Emily Chew, Dragomir Radev, Zhiyong Lu, Hua Xu, Qingyu Chen, Irene Li. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 03.10.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e60601" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Medical texts present significant domain-specific challenges, and manually curating these texts is a time-consuming and labor-intensive process. To address this, natural language processing (NLP) algorithms have been developed to automate text processing. In the biomedical field, various toolkits for text processing exist, which have greatly improved the efficiency of handling unstructured text. However, these existing toolkits tend to emphasize different perspectives, and none of them offer generation capabilities, leaving a significant gap in the current offerings.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to describe the development and preliminary evaluation of Ascle. Ascle is tailored for biomedical researchers and clinical staff with an easy-to-use, all-in-one solution that requires minimal programming expertise. For the first time, Ascle provides 4 advanced and challenging generative functions: question-answering, text summarization, text simplification, and machine translation. In addition, Ascle integrates 12 essential NLP functions, along with query and search capabilities for clinical databases.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We fine-tuned 32 domain-specific language models and evaluated them thoroughly on 27 established benchmarks. In addition, for the question-answering task, we developed a retrieval-augmented generation (RAG) framework for large language models that incorporated a medical knowledge graph with ranking techniques to enhance the reliability of generated answers. Additionally, we conducted a physician validation to assess the quality of generated content beyond automated metrics.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The fine-tuned models and RAG framework consistently enhanced text generation tasks. For example, the fine-tuned models improved the machine translation task by 20.27 in terms of BLEU score. In the question-answering task, the RAG framework raised the ROUGE-L score by 18% over the vanilla models. Physician validation of generated answers showed high scores for readability (4.95/5) and relevancy (4.43/5), with a lower score for accuracy (3.90/5) and completeness (3.31/5).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study introduces the development and evaluation of Ascle, a user-friendly NLP toolkit designed for medical text generation. All code is publicly available through the Ascle GitHub repository. All fine-tuned language models can be accessed through Hugging Face.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>natural language processing</kwd>
        <kwd>machine learning</kwd>
        <kwd>deep learning</kwd>
        <kwd>generative artificial intelligence</kwd>
        <kwd>large language models</kwd>
        <kwd>retrieval-augmented generation</kwd>
        <kwd>healthcare</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Medical texts pose considerable challenges due to their domain-specific nature, including issues such as ambiguities, frequent abbreviations, and specialized terminology [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. The manual curation of these texts is both time-consuming and labor-intensive [<xref ref-type="bibr" rid="ref2">2</xref>]. Therefore, natural language processing (NLP) algorithms have been developed to automate text processing [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Recent years have seen a notable shift toward the use of domain-specific pretrained language models, transitioning from shallow embeddings such as BioWordVec [<xref ref-type="bibr" rid="ref5">5</xref>] and BioSentVec [<xref ref-type="bibr" rid="ref6">6</xref>] to advanced architectures like Bidirectional Encoder Representations from Transformers (BERT) [<xref ref-type="bibr" rid="ref7">7</xref>], such as BioBERT [<xref ref-type="bibr" rid="ref8">8</xref>], ClinicalBERT [<xref ref-type="bibr" rid="ref9">9</xref>], and PubMedBERT [<xref ref-type="bibr" rid="ref10">10</xref>]. Furthermore, large language models (LLMs), such as Med-PaLM [<xref ref-type="bibr" rid="ref11">11</xref>] and Med-Gemini [<xref ref-type="bibr" rid="ref12">12</xref>], have demonstrated powerful generative capabilities, possessing exceptional zero- and few-shot performance. These domain-specific language models have substantially enhanced the effectiveness of NLP tasks in the biomedical and clinical domains [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      <p>Despite the success of these advanced methods, their complexity remains a significant barrier to practical application for health care professionals lacking basic programming skills. Consequently, there is an increasing demand for user-friendly and accessible toolkits designed to simplify medical text processing. Multiple toolkits for text processing are available in the biomedical domain. <xref ref-type="table" rid="table1">Table 1</xref> summarizes representative tools. While there are many other useful tools, here we mainly limit our comparison with Python-based open-source toolkits.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>A comparison of Ascle with existing Python-based toolkits.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="230"/>
          <col width="130"/>
          <col width="130"/>
          <col width="130"/>
          <col width="130"/>
          <col width="130"/>
          <col width="120"/>
          <thead>
            <tr valign="top">
              <td>Toolkits</td>
              <td>Question-<break/>Answering<sup>a</sup></td>
              <td>Text<break/>Summarization</td>
              <td>Text<break/>Simplification</td>
              <td>Machine<break/>Translation</td>
              <td>Basic NLP<sup>b</sup> Functions</td>
              <td>Query Search</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>MIMIC-Extract [<xref ref-type="bibr" rid="ref16">16</xref>]</td>
              <td>—<sup>c</sup></td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>✓</td>
            </tr>
            <tr valign="top">
              <td>ScispaCy [<xref ref-type="bibr" rid="ref17">17</xref>]</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>✓</td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td>MedspaCy [<xref ref-type="bibr" rid="ref18">18</xref>]</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>✓</td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td>Transformers-sklearn [<xref ref-type="bibr" rid="ref19">19</xref>]</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>✓</td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td>Stanza Biomed [<xref ref-type="bibr" rid="ref20">20</xref>]</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>✓</td>
              <td>—</td>
            </tr>
            <tr valign="top">
              <td>Ascle (this study)</td>
              <td>✓</td>
              <td>✓</td>
              <td>✓</td>
              <td>✓</td>
              <td>✓</td>
              <td>✓</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>For the question-answering task, we specifically propose a retrieval-augmented generation framework for large language models that incorporates a medical knowledge graph with ranking techniques.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>NLP: natural language processing. Basic natural language processing functions include abbreviation extraction, sentence tokenization, word tokenization, negation detection, hyponym detection, Unified Medical Language System concept extraction, named entity recognition, document clustering, part-of-speech tagging, entity linking, text summarization (extractive methods), and multiple-choice question-answering. It is worth noting that not every toolkit includes these 12 basic natural language processing functions, but Ascle includes them all.</p>
          </fn>
          <fn id="table1fn3">
            <p><sup>c</sup>Not applicable.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>These existing toolkits tend to emphasize different perspectives, and none of them offer generation capabilities, leaving a significant gap in the current offerings. In response, we present Ascle, a pioneering NLP toolkit for medical text generation, which, for the first time, includes 4 advanced generative functions. We fine-tuned 32 domain-specific language models and evaluated them thoroughly on 27 established benchmarks. In addition, for the question-answering task, we developed a retrieval-augmented generation (RAG) framework [<xref ref-type="bibr" rid="ref21">21</xref>] that combines a medical knowledge graph (The Unified Medical Language System [UMLS]) [<xref ref-type="bibr" rid="ref22">22</xref>] with ranking techniques, aimed at improving the reliability of long-form answers [<xref ref-type="bibr" rid="ref15">15</xref>]. We uploaded all fine-tuned language models to Hugging Face and listed 32 fine-tuned language models along with 27 benchmarks in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for a clearer explanation.</p>
      <p>In conclusion, Ascle empowers a diverse spectrum of users, from novices to experienced professionals, enabling them to effortlessly address their NLP tasks, even with limited technical expertise in handling textual data. We believe that Ascle not only democratizes access to cutting-edge methods but also expedites their integration into health care.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>The Overall Architecture of Ascle</title>
        <p>Ascle consists of 3 modules, with the core module being the “generative functions,” including 4 challenging generation tasks: question-answering, text summarization, text simplification, and machine translation, covering a variety of application scenarios in health care. In addition, Ascle integrates 12 basic NLP functions, as well as query and search capabilities for clinical databases. The overall architecture of Ascle is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. This section will focus on introducing the core module of Ascle—Generative Functions. For more information on basic NLP functions and query and search functions within Ascle, please refer to <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>, respectively.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The overall architecture of Ascle. <inline-graphic xlink:href="jmir_v26i1e60601_fig4.png" mimetype="image" xlink:type="simple"/> indicates that we have our fine-tuned language models for this task. <inline-graphic xlink:href="jmir_v26i1e60601_fig5.png" mimetype="image" xlink:type="simple"/> indicates that we conducted evaluations for this task. POS: Parts-Of-Speech; QA: Question-Answering; UMLS: Unified Medical Language System.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e60601_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Generative Functions</title>
        <p>Ascle offers a range of generative functions through pretrained and fine-tuned language models, all of which are publicly available for user access. In the following sections, we will introduce these powerful generative functions separately.</p>
        <sec>
          <title>Question-Answering</title>
          <p>Question-answering is particularly crucial in health care [<xref ref-type="bibr" rid="ref13">13</xref>]. When integrated into health care systems, it assumes roles, such as preconsultation and remote consultation, effectively coping with the exponential increase in patient load. Furthermore, specialized question-answering systems hold the potential to contribute to medical education [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref21">21</xref>].</p>
          <p>In Ascle, we first provide an interface for medical LLMs, such as Baize-healthcare [<xref ref-type="bibr" rid="ref23">23</xref>], allowing users to use them directly. In addition, we develop a RAG framework that uses UMLS with ranking techniques to enhance LLMs in generating long-form answers [<xref ref-type="bibr" rid="ref21">21</xref>]. Specifically, when receiving a query, the RAG framework first extracts medical entities within the query automatically and then retrieves related triplets from UMLS for each extracted entity. A triplet consists of 2 medical concepts and the relation between them, that is, (Myopia, clinically_associated_with, HYPERGLYCEMIA). Subsequently, the RAG framework uses ranking and reranking techniques to refine the ordering of these triples. Finally, the query and the retrieved triplets would be prompted to LLM for inference. For more details about the RAG framework, please refer to <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. We apply this framework to the GPT (OpenAI) [<xref ref-type="bibr" rid="ref24">24</xref>] and LLaMA (Meta) [<xref ref-type="bibr" rid="ref25">25</xref>] series of LLMs.</p>
          <p>We conducted evaluations on 4 medical QA data sets, including LiveQA [<xref ref-type="bibr" rid="ref26">26</xref>], ExpertQA (Med &#38; Bio) [<xref ref-type="bibr" rid="ref27">27</xref>], and MedicationQA [<xref ref-type="bibr" rid="ref28">28</xref>]. LiveQA consists of health questions submitted by consumers to the National Library of Medicine. It includes a training set with 634 QA pairs and a test set comprising 104 QA pairs, and the test set was used for evaluation. ExpertQA is a high-quality long-form QA data set covering multiple fields, along with answers verified by domain experts. Among them, we used 504 medical questions (Med) and 96 biology (Bio) questions for evaluation. MedicationQA includes 690 drug-related consumer questions along with information retrieved from reliable websites and scientific papers.</p>
          <p>Additionally, considering that automated metrics cannot effectively assess the quality of generated content, especially in terms of factuality, we performed a physician validation. A total of 50 question-answer pairs from LiveQA were randomly selected, with answers generated by Baize-healthcare. Subsequently, 2 health care professionals (1 resident and 1 attending specialist) rated these generated answers on the criteria of readability, relevancy, accuracy, and completeness, using a 5-point Likert scale.</p>
        </sec>
        <sec>
          <title>Text Summarization</title>
          <p>In health care, clinicians and researchers are confronted with an increasing amount of information, including literature, clinical notes, and more [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Text summarization is an important generation task, aiming to distill essential information from the overwhelming complexity of texts and compress it into a more concise format [<xref ref-type="bibr" rid="ref31">31</xref>]. Through automatic text summarization, clinicians and researchers can efficiently acquire information, thereby avoiding information overload.</p>
          <p>We provide an abstractive text summarization function and compare general pretrained summarization models, including Pegasus [<xref ref-type="bibr" rid="ref32">32</xref>], BigBird [<xref ref-type="bibr" rid="ref33">33</xref>], Bidirectional and Auto-Regressive Transformer (BART) [<xref ref-type="bibr" rid="ref34">34</xref>], PRIMERA [<xref ref-type="bibr" rid="ref35">35</xref>], as well as domain-specific models, such as SciFive [<xref ref-type="bibr" rid="ref36">36</xref>] and BioBART [<xref ref-type="bibr" rid="ref37">37</xref>], which make use of biomedical corpora. Furthermore, we chose PubMed [<xref ref-type="bibr" rid="ref38">38</xref>], MIMIC Chest X-Ray (MIMIC-CXR [<xref ref-type="bibr" rid="ref39">39</xref>]), and MEDIQA-AnS [<xref ref-type="bibr" rid="ref40">40</xref>] data sets for evaluation. The PubMed data set consists of biomedical scientific publications from the PubMed database, where each input document is a scientific article with its abstract serving as the ground truth. We reported the evaluation results for the test set, which contains 1660 examples. MIMIC-CXR is a deidentified data set of chest radiographs with free-text radiology reports, and we used a subset of MIMIC-CXR that includes 2000 instances for evaluation. MEDIQA-AnS is a collection of 156 consumer health questions along with passages that contain relevant information. It supports both single-document and multiple-document summarization evaluation.</p>
        </sec>
        <sec>
          <title>Text Simplification</title>
          <p>Biomedical texts are typically laden with intricate terminologies, which can hinder the understanding of individuals without a clinical background [<xref ref-type="bibr" rid="ref41">41</xref>]. In Ascle, the function of text simplification is to translate complex and technical biomedical texts into understandable content. This will enhance the comprehension and involvement of nonclinical individuals, including patients, enabling them to better engage with the information and participate in clinical decisions more effectively.</p>
          <p>We finetuned and evaluated widely used pretrained language models on 3 data sets: eLife, PLOS [<xref ref-type="bibr" rid="ref42">42</xref>], and MedLane [<xref ref-type="bibr" rid="ref43">43</xref>]. This included 2 general models, BigBirdPegasus [<xref ref-type="bibr" rid="ref32">32</xref>] and BART, as well as a biomedical-specific model, BioBART. The eLife and PLOS are shared task data released from the BioLaySumm 2023 Task 1, which contains biomedical journal articles with expert-written lay summaries. We evaluated the validation sets for eLife and PLOS, which contain 241 and 1376 examples, respectively. MedLane is a large-scale human-annotated data set containing professional-to-customer sentences selected from Medical Information Mart for Intensive Care III (MIMIC-III). For MedLane, we used the test set for evaluation, which includes 1016 instances.</p>
        </sec>
        <sec>
          <title>Machine Translation</title>
          <p>Language barriers pose difficulties for patients to access timely information and communicate effectively with health care providers, resulting in low-quality health care services [<xref ref-type="bibr" rid="ref44">44</xref>]. Our machine translation function aims to translate the text from a source language into a target language in a clinical scenario. By fine-tuning pretrained language models on the medical corpus, Ascle supports machine translation from English (en) to 8 target languages: Spanish (es), French (fr), Romanian (ro), Czech (cs), German (de), Hungarian (hu), Polish (pl), and Swedish (sv). Here, we only emphasize the 8 languages fine-tuned on medical data, while other languages, such as English to Chinese, are supported by the pretrained language models.</p>
          <p>We fine-tuned the existing MarianMT [<xref ref-type="bibr" rid="ref45">45</xref>] and multilingual T5 [<xref ref-type="bibr" rid="ref46">46</xref>] using UFAL Medical Corpus [<xref ref-type="bibr" rid="ref47">47</xref>] which includes various medical text sources, such as titles of medical Wikipedia articles, medical term pairs, patents, and documents from the European Medicines Agency. During the preprocessing phase, we excluded general domain data from UFAL, such as parliamentary proceedings, and randomly shuffled the medical domain corpora, splitting them into 2 parts at a ratio of 85% and 15% for training and testing, respectively. We reported the results on the test set, the size of which varies from 111,779 to 407,388 depending on the different language pairs. Furthermore, for each language pair, we used all available parallel data to maximize the breadth and accuracy of our machine translation function.</p>
        </sec>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study used publicly available data sets and a restricted, deidentified data set. Access to the restricted data set was granted after the required training and certification, ensuring compliance with the data use agreement. No additional ethical review or informed consent was necessary, as human subjects or identifiable data were not directly involved. Two health care professionals voluntarily participated in the physician validation process without compensation. Data privacy and confidentiality were strictly maintained throughout the research, ensuring the protection of individual privacy while contributing to the advancement of the NLP toolkit for medical text generation.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overall Performance of Generation Tasks</title>
        <p>In the question-answering task, we used ROUGE-L [<xref ref-type="bibr" rid="ref48">48</xref>], BERTScore [<xref ref-type="bibr" rid="ref49">49</xref>], MoverScore [<xref ref-type="bibr" rid="ref50">50</xref>], and BLEURT [<xref ref-type="bibr" rid="ref51">51</xref>] for a comprehensive evaluation, and used GPT-4 and LLaMA2-13b as the vanilla LLMs. As shown in <xref ref-type="table" rid="table2">Table 2</xref>, our RAG framework surpasses the zero-shot setting on all evaluation metrics for the LiveQA, ExpertQA-Bio, ExpertQA-Med, and MedicationQA data sets. Among them, the ROUGE-L score has increased by more than 18% on the ExpertQA-Bio data set.</p>
        <p>For the text summarization task, we evaluated 5 pretrained language models on single-document summarization, as shown in <xref ref-type="table" rid="table3">Table 3</xref>. To ensure a fair comparison, we excluded the results of BioBART and SciFive on PubMed, as they were fine-tuned on this data set. It is worth noting that BART consistently demonstrated strong performance across 3 benchmarks, while BioBART only outperformed BART in 1 of the benchmarks. In addition, we evaluated the multidocument summarization task and discussed the differences between abstractive and extractive methods, as well as the limitations of evaluation metrics, which can be found in the Discussion section.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>For the evaluation of the question-answering task, we compared ROUGE-L, BERTScore, MoverScore, and BLEURT on the zero-shot and retrieval-augmented generation framework.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="100"/>
            <col width="0"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="100"/>
            <col width="0"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="5">LLaMa2-13b</td>
                <td colspan="4">GPT-4</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td>ROUGE-L</td>
                <td>BERTScore</td>
                <td>MoverScore</td>
                <td>BLEURT</td>
                <td colspan="2">ROUGE -L</td>
                <td>BERTScore</td>
                <td>MoverScore</td>
                <td>BLEURT</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="12">
                  <bold>LiveQA<sup>a</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Z.S<sup>b</sup></td>
                <td>17.73</td>
                <td>81.93</td>
                <td>53.37</td>
                <td>40.45</td>
                <td colspan="2">18.89</td>
                <td>82.50</td>
                <td>54.02</td>
                <td>39.84</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">RAG<sup>c</sup></td>
                <td>18.83<sup>d</sup></td>
                <td>82.79<sup>d</sup></td>
                <td>53.79<sup>d</sup></td>
                <td>40.59<sup>d</sup></td>
                <td colspan="2">19.44<sup>d</sup></td>
                <td>83.01<sup>d</sup></td>
                <td>54.11<sup>d</sup></td>
                <td>40.55<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>ExpertQA<sup>a</sup>-Bio</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Z.S</td>
                <td>23.26</td>
                <td>84.38</td>
                <td>55.58</td>
                <td>44.65</td>
                <td colspan="2">23.00</td>
                <td>84.50</td>
                <td>56.15</td>
                <td>44.53</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">RAG</td>
                <td>25.79<sup>d</sup></td>
                <td>85.18<sup>d</sup></td>
                <td>56.17<sup>d</sup></td>
                <td>45.20<sup>d</sup></td>
                <td colspan="2">27.20<sup>d</sup></td>
                <td>85.83<sup>d</sup></td>
                <td>57.11<sup>d</sup></td>
                <td>45.91<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>ExpertQA<sup>a</sup>-Med</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Z.S</td>
                <td>24.86</td>
                <td>84.89</td>
                <td>55.74</td>
                <td>46.32</td>
                <td colspan="2">25.45</td>
                <td>85.11</td>
                <td>56.50</td>
                <td>45.98</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">RAG</td>
                <td>27.49<sup>d</sup></td>
                <td>85.80<sup>d</sup></td>
                <td>56.58<sup>d</sup></td>
                <td>46.47<sup>d</sup></td>
                <td colspan="2">28.08<sup>d</sup></td>
                <td>86.30<sup>d</sup></td>
                <td>57.32<sup>d</sup></td>
                <td>47.00<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="12">
                  <bold>MedicationQA<sup>a</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Z.S</td>
                <td>13.30</td>
                <td>81.81</td>
                <td>51.96</td>
                <td>38.30</td>
                <td colspan="2">14.41</td>
                <td>82.55</td>
                <td>52.62</td>
                <td>37.41</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">RAG</td>
                <td>14.71<sup>d</sup></td>
                <td>82.79<sup>d</sup></td>
                <td>52.59<sup>d</sup></td>
                <td>38.42<sup>d</sup></td>
                <td colspan="2">16.19<sup>d</sup></td>
                <td>83.59<sup>d</sup></td>
                <td>53.30<sup>d</sup></td>
                <td>37.91<sup>d</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>QA: question-answering.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Z.S: zero-shot.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>RAG: retrieval-augmented generation framework.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>The superior score within the same data set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>For the evaluation of the single-document summarization task, we compared ROUGE-1, ROUGE-2, ROUGE-L, and some results are derived from other papers [<xref ref-type="bibr" rid="ref52">52</xref>].</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="130"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="70"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">PubMed</td>
                <td colspan="4">MIMIC-CXR<sup>a</sup></td>
                <td colspan="4">MEDIQA-AnS (p)</td>
                <td colspan="3">MEDIQA-AnS (s)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>R-1</td>
                <td>R-2</td>
                <td>R-L</td>
                <td colspan="2">R-1</td>
                <td>R-2</td>
                <td>R-L</td>
                <td colspan="2">R-1</td>
                <td>R-2</td>
                <td>R-L</td>
                <td colspan="2">R-1</td>
                <td>R-2</td>
                <td>R-L</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Pegasus</td>
                <td>45.97</td>
                <td>20.15</td>
                <td>28.25</td>
                <td colspan="2">22.49</td>
                <td>11.57</td>
                <td>20.35</td>
                <td colspan="2">18.29</td>
                <td>4.82</td>
                <td>13.87</td>
                <td colspan="2">22.21</td>
                <td>8.23</td>
                <td>16.76</td>
              </tr>
              <tr valign="top">
                <td>BigBird</td>
                <td>46.32</td>
                <td>20.65</td>
                <td>42.33<sup>b</sup></td>
                <td colspan="2">38.99</td>
                <td>29.52</td>
                <td>38.59</td>
                <td colspan="2">13.18</td>
                <td>2.14</td>
                <td>10.04</td>
                <td colspan="2">14.89</td>
                <td>3.13</td>
                <td>11.15</td>
              </tr>
              <tr valign="bottom">
                <td>BART</td>
                <td>48.35<sup>b</sup></td>
                <td>21.43<sup>b</sup></td>
                <td>36.90</td>
                <td colspan="2">41.70<sup>b</sup></td>
                <td>32.93<sup>b</sup></td>
                <td>41.16<sup>b</sup></td>
                <td colspan="2">24.02<sup>b</sup></td>
                <td>7.20</td>
                <td>17.09<sup>b</sup></td>
                <td colspan="2">38.19</td>
                <td>22.20</td>
                <td>30.58</td>
              </tr>
              <tr valign="top">
                <td>SciFive</td>
                <td>—<sup>c</sup></td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">35.41</td>
                <td>26.48</td>
                <td>35.07</td>
                <td colspan="2">13.08</td>
                <td>2.15</td>
                <td>10.10</td>
                <td colspan="2">16.88</td>
                <td>6.47</td>
                <td>14.42</td>
              </tr>
              <tr valign="bottom">
                <td>BioBART</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td colspan="2">41.61</td>
                <td>32.90</td>
                <td>41.00</td>
                <td colspan="2">22.58</td>
                <td>7.49<sup>b</sup></td>
                <td>16.69</td>
                <td colspan="2">39.40<sup>b</sup></td>
                <td>24.64<sup>b</sup></td>
                <td>32.07<sup>b</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>MIMIC-CXR: MIMIC Chest X-Ray database.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>The superior score within the same data set.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Regarding the text simplification task, we compared the performance of fine-tuned models and conducted an analysis of readability using the Flesch-Kincaid Grade Level (FKGL) score [<xref ref-type="bibr" rid="ref53">53</xref>], as indicated in <xref ref-type="table" rid="table4">Table 4</xref>. For the eLife and PLOS data sets, the ground truth exhibits FKGL scores of 12 and 15, respectively. Interestingly, the BioBART model performs competitively in terms of ROUGE metrics, but fails to significantly reduce the difficulty of understanding, as evidenced by its FKGL score of 17 in both data sets. On the other hand, the BART model manages to slightly lower the FKGL score to 14 and 16 for eLife and PLOS, respectively. However, in the case of the MedLane data set, all methods appear to reach a similar level of complexity as the ground truth. This can be attributed to the data set’s shorter examples and potentially smaller vocabulary size, which limits the observed differences.</p>
        <p>In the machine translation task, we fine-tuned the models across 8 languages, as illustrated in <xref ref-type="table" rid="table5">Table 5</xref>. After fine-tuning, the BLEU scores significantly improved, with the most substantial improvement observed in the “en-fr” language pair, increasing by over 61%. This enhancement can be attributed to the larger amount of training data available for “en-fr” (2,812,305 samples).</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>For evaluation of the text simplification task, we compared ROUGE-1, ROUGE-2, ROUGE-L, and Flesch-Kincaid Grade Level score.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="70"/>
            <col width="70"/>
            <col width="90"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">eLife</td>
                <td colspan="5">PLOS</td>
                <td colspan="4">MedLane</td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>R-1<sup>a</sup></td>
                <td>R-2<sup>b</sup></td>
                <td>R-L<sup>c</sup></td>
                <td>FKGL<sup>d</sup></td>
                <td colspan="2">R-1</td>
                <td>R-2</td>
                <td>R-L</td>
                <td>FKGL</td>
                <td colspan="2">R-1</td>
                <td>R-2</td>
                <td>R-L</td>
                <td>FKGL</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="bottom">
                <td>Ground Truth</td>
                <td>—<sup>e</sup></td>
                <td>—</td>
                <td>—</td>
                <td>12</td>
                <td colspan="2">—</td>
                <td>—</td>
                <td>—</td>
                <td>15</td>
                <td colspan="2">—</td>
                <td>—</td>
                <td>—</td>
                <td>13</td>
              </tr>
              <tr valign="bottom">
                <td>BigBirdPegasus</td>
                <td>14.00</td>
                <td>3.42</td>
                <td>9.16</td>
                <td>13<sup>f</sup></td>
                <td colspan="2">18.92</td>
                <td>4.79</td>
                <td>12.54</td>
                <td>17</td>
                <td colspan="2">74.96</td>
                <td>65.37</td>
                <td>74.56</td>
                <td>13<sup>f</sup></td>
              </tr>
              <tr valign="bottom">
                <td>BART</td>
                <td>16.16<sup>f</sup></td>
                <td>4.31<sup>f</sup></td>
                <td>10.19<sup>f</sup></td>
                <td>14</td>
                <td colspan="2">21.09</td>
                <td>7.20</td>
                <td>14.17</td>
                <td>16<sup>f</sup></td>
                <td colspan="2">83.25<sup>f</sup></td>
                <td>74.50<sup>f</sup></td>
                <td>82.99<sup>f</sup></td>
                <td>13<sup>f</sup></td>
              </tr>
              <tr valign="bottom">
                <td>BioBART</td>
                <td>14.31</td>
                <td>3.70</td>
                <td>9.36</td>
                <td>17</td>
                <td colspan="2">23.80<sup>f</sup></td>
                <td>7.83<sup>f</sup></td>
                <td>15.65<sup>f</sup></td>
                <td>17</td>
                <td colspan="2">82.89</td>
                <td>74.26</td>
                <td>82.65</td>
                <td>13<sup>f</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>R-1: ROUGE-1.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>R-2: ROUGE-2.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>R-L: ROUGE-L.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>FKGL: Flesch-Kincaid Grade Level.</p>
            </fn>
            <fn id="table4fn5">
              <p><sup>e</sup>Not applicable.</p>
            </fn>
            <fn id="table4fn6">
              <p><sup>f</sup>The superior score within the same data set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>For the evaluation of the machine translation task, we evaluated the BLEU score on 8 language pairs.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="170"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="8">BLEU score</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>en-es<sup>a</sup></td>
                <td>en-fr<sup>b</sup></td>
                <td>en-ro<sup>c</sup></td>
                <td>en-cs<sup>d</sup></td>
                <td>en-de<sup>e</sup></td>
                <td>en-hu<sup>f</sup></td>
                <td>en-pl<sup>g</sup></td>
                <td>en-sv<sup>h</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>MarianMT</td>
                <td>38.02</td>
                <td>33.02</td>
                <td>40.45</td>
                <td>—<sup>i</sup></td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>F.T-MarianMT</td>
                <td>41.64</td>
                <td>43.72</td>
                <td>43.88</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="bottom">
                <td>F.T-mT5</td>
                <td>45.88<sup>j</sup></td>
                <td>53.29<sup>j</sup></td>
                <td>47.28<sup>j</sup></td>
                <td>43.30</td>
                <td>50.73</td>
                <td>32.25</td>
                <td>40.24</td>
                <td>44.17</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>en-es: English-Spanish.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>en-fr: English-French.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>en-ro: English-Romanian.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>en-cs: English-Czech.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>en-de: English-German.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>en-hu: English-Hungarian.</p>
            </fn>
            <fn id="table5fn7">
              <p><sup>g</sup>en-pl: English-Polish.</p>
            </fn>
            <fn id="table5fn8">
              <p><sup>h</sup>en-sv: English-Swedish.</p>
            </fn>
            <fn id="table5fn9">
              <p><sup>i</sup>Not applicable.</p>
            </fn>
            <fn id="table5fn10">
              <p><sup>j</sup>The superior score within the same data set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Physician Validation</title>
        <p>The results verified by the physicians are shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>A. Detailed evaluation criteria can be found in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. The generated answers have good readability and relatively good relevancy, with scores of 4.95 and 4.43, respectively. In contrast, the completeness score is relatively lower (3.31). <xref rid="figure2" ref-type="fig">Figure 2</xref>B shows 2 cases. In the first case, compared with the ground truth, the generated answer does not point out that Zolmitriptan is used for treating acute migraines, nor does it indicate that it cannot be used to prevent migraine attacks or to reduce the frequency of headaches. In the second case, the generated answer does not mention that a gluten-free diet is the main treatment for celiac disease. We provide 2 additional cases in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>.</p>
        <p>In addition, we calculated the interevaluator agreement using percentage agreement for each criterion. A total of 2 health care professionals demonstrated a high level of consistency across all criteria, with the percentage agreement consistently exceeding 0.65.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>(A) Physician validation (readability, relevancy, accuracy, and completeness) for 50 question-answer pairs. (B) Two examples of generated answers with ground truth.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e60601_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>In-Depth Analysis of the Text Summarization Task</title>
        <p>In the multidocument summarization task, we included models based on traditional methods, such as TextRank [<xref ref-type="bibr" rid="ref54">54</xref>], as well as pretrained language models, such as BART, Pegasus, PRIMERA, and BioBART. We evaluated their performance using ROUGE scores on the MEDIQA-AnS data set, which consists of 156 examples, and the results are shown in <xref ref-type="table" rid="table6">Table 6</xref>. However, it is noteworthy that although TextRank outperforms almost all generative models in ROUGE scores, this does not necessarily indicate superior performance. As ROUGE scores are calculated based on the overlap between the generated content and reference summaries, and TextRank is an extractive summarization model, it tends to score higher by this measure.</p>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Evaluation for the multidocument summarization task.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="200"/>
            <col width="130"/>
            <col width="130"/>
            <col width="130"/>
            <col width="0"/>
            <col width="130"/>
            <col width="130"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">MEDIQA-AnS (p)</td>
                <td colspan="3">MEDIQA-AnS (s)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ROUGE-1</td>
                <td>ROUGE-2</td>
                <td>ROUGE-L</td>
                <td colspan="2">ROUGE-1</td>
                <td>ROUGE-2</td>
                <td>ROUGE-L</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="bottom">
                <td>TextRank<sup>a</sup></td>
                <td>29.88</td>
                <td>10.23</td>
                <td>17.01</td>
                <td colspan="2">43.77</td>
                <td>26.80</td>
                <td>30.52</td>
              </tr>
              <tr valign="bottom">
                <td>BART</td>
                <td>24.56<sup>b</sup></td>
                <td>7.56<sup>b</sup></td>
                <td>17.18<sup>b</sup></td>
                <td colspan="2">32.32<sup>b</sup></td>
                <td>15.42</td>
                <td>24.03<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Pegasus</td>
                <td>17.44</td>
                <td>5.36</td>
                <td>13.44</td>
                <td colspan="2">19.54</td>
                <td>7.46</td>
                <td>14.93</td>
              </tr>
              <tr valign="top">
                <td>PRIMERA</td>
                <td>16.66</td>
                <td>4.89</td>
                <td>12.68</td>
                <td colspan="2">21.78</td>
                <td>9.77</td>
                <td>16.85</td>
              </tr>
              <tr valign="bottom">
                <td>BioBART</td>
                <td>23.16</td>
                <td>7.47</td>
                <td>16.47</td>
                <td colspan="2">30.87</td>
                <td>15.91<sup>b</sup></td>
                <td>23.66</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>TextRank is only used as a reference for extractive summarization, so its scores are not compared with those of generative models.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>The superior score within the same data set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>While generative models possess semantic comprehension abilities, enabling them to distill complex information into an easy-to-understand format. As shown in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>, the summarizations generated by BART display well-structured patient information, with a brief description of events and corresponding conditions of the current patient (highlighted in blue), exhibiting high readability. In contrast, the summarizations produced by TextRank are less readable and include noise (highlighted in orange); the generated content is often a literal collage of text fragments. Despite TextRank achieving higher ROUGE scores, it lacks the ability to discern information and integrate it into coherent and readable content, showing significant limitations for practical use.</p>
        <boxed-text id="box1" position="float">
          <title>Two MIMIC-III (parts) examples of the text summarization task, generated by BART and TextRank, respectively (we eliminated sensitive information).</title>
          <p>
            <bold>BART</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>The patient is an XXX-year-old man with a history of a question of coronary artery disease, borderline diabetes mellitus. He was in his usual state of health until 11 p.m. last night when he experienced chest pain with radiation to his back, positive shortness of breath, positive diaphoresis, no vomiting, no lightheadedness. The patient had had a similar episode of chest pain and was taken to an XXX. He had successful angioplasty and stent of LAD and CX. He is a middle aged XXX man in no acute hypertensive distress. He has had anginal chest pain, which is similar to his presenting complaint, but without radiations to his Back. His blood pressure was 105/73, pulse 84, respiratory 21, O2 saturation 92% on 2 liters. His CPK was 594, The index was 7.7, and he was admitted to the hospital with a high blood pressure. His condition was described as “stable” and “normal” by the doctor. The doctor referred the patient to a cardiologist for further treatment. The cardiologist said the patient was in good condition and should be discharged in a few days.</p>
            </list-item>
            <list-item>
              <p>Patient has CABG complicated by postop bleed and pleural effusion with discharge to [**Hospital1 **] Rehabilitation presents with abdominal pain. Zosyn was given in the ED. Patient was otherwise doing well and was to go back to rehab to finish his course of Cipro and Flagyl on [**5-17**]. Patient was last seen normal sometime last evening. He woke up and noticed that the left side of his body felt “numb”. He was not aware of any other</p>
              <p>neurological weakness, and mostly complained of being very tired. He denied any new vision problems, did not have a headache. He sounded somewhat slurred but did not feel as if his speech was changed significantly. He felt sleepy but able to sustain attention, currently apparently in no distress. He was on standing. Plavix and [**State **] which had been held for the last few days (at least since the 14), since he had the percutaneous drainage. He did not. feel that the weakness had progress and reported that he felt the sense of numbness was starting to improve and had some difficulty squeezing an examiners hand. He is a retired postal worker. He lives with wife and son who is a chiropractor.</p>
            </list-item>
          </list>
          <p>
            <bold>TextRank</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Admission Date: XXX Discharge Date: XXX Date of Birth: Sex: M Service: CCU-6HISTORY OF PRESENT ILLNESS: The patient is a XXX-year-old man with a history of a question of coronary artery disease, status post myocardial infarction in [**December 2175**], hypertension, borderline diabetes mellitus who was in his usual state of health until 11 p.m. last night when, while [**4-12**] midsternal pressure like chest pain with radiation to back, positive shortness of breath, positive diaphoresis, positive nausea, no vomiting, no lightheadedness. Mucous membranes moist. Oropharynx clear. NECK:  No jugular venous distention, no carotid bruits. CARDIOVASCULAR:  Regular rate, S1, S2, artificial S1 gallop and balloon pump, no murmurs or rubs. LUNGS: Bibasilar rales, left greater than right. ABDOMEN:  Normoactive bowel sounds, nontender, nondistended. EXTREMITIES:  No cyanosis, clubbing or edema. NEUROLOGIC:  Alert and oriented x3.LABS AT OUTSIDE HOSPITAL:  CPK was 304, troponin 1.75.Electrocardiogram at 1:23 a.m. was normal sinus rhythm at101, normal axis deviation, 2 to [**Street Address(2) 1755**] elevation V1 to V5,Q V3, AVF.LABS AT [**Hospital6 **] AT 8 A.M.:  CBC- white blood cells 11.2, hemoglobin 13.0, hematocrit 36.7,platelets 232. CARDIOVASCULAR: Coronary artery disease: Three vessel disease with successful intervention on LAD and left circumflex, but RCA not done secondary to good collateral. The patient was continued on aspirin 325 qd.</p>
            </list-item>
            <list-item>
              <p>Of note he was on standing Plavix and [**State **] which had been held for the last few days (atleast since the 14), since he had the percutaneous drainage. The patient was otherwise doing well and was to go back to rehab to finish his course of Cipro and Flagyl on [**5-17**].Past Medical History: coronary artery disease s/p right coronary artery stent x2([**10-3**], [**3-4**]), hypertension, hyperlipidemia, chronic obstructive pulmonary disease, asbestos exposure, chronic back pain, insomnia and obstructive sleep apnea (untreated)PSH:[**2144-4-21**]Endoscopic, minimally invasive, off pump coronary artery bypass graft x1 with left internal mammary artery to left anterior descending artery.[**2144-4-21**]Re-exploration for bleeding, post coronary artery bypass grafting. Social History: Lives with wife. Exposure to asbestos. Defers all medical decisions to son who is a chiropractor. Occupation: retired postal worker. Tobacco: 3 PPD x 30 years, quit 45 years ago ETOH: None Family History: Non-contributory to cholecystitis. Physical Exam: Physical Exam: Vitals: T: 97.9  P:75  R: 16  BP:128/73  SaO2:96 General: Awake, felt sleepy but able to sustain attention, poor historian currently.</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>System Usage</title>
        <p>Ascle provides an easy-to-use approach for biomedical researchers and clinical staff. Users can efficiently use it by merely inputting text and calling the required functions. <xref rid="figure3" ref-type="fig">Figure 3</xref> illustrates 2 use cases.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Demonstration of system usage. We show two use cases: Text Simplification and Machine Translation.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e60601_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Estimated Inference Time and Computational Resources</title>
        <p>As shown in <xref ref-type="table" rid="table7">Table 7</xref>, we list the estimated inference time and computational resources required for the 4 generative tasks in Ascle. It is worth noting that the inference time is specific to our experimental settings, and the actual inference time for users may vary depending on the length of the input text and the computational resources used. For the question-answering task, GPT’s response time is faster compared with LLaMA2-13b. However, it is important to mention that LLaMA2-13b was not deployed with quantization, and with quantization, the required inference time and computational resource requirements would be reduced.</p>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Estimated inference time and computational resources required for the generative tasks in Ascle.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="320"/>
            <col width="380"/>
            <thead>
              <tr valign="top">
                <td>Tasks</td>
                <td>Estimated inference time</td>
                <td>Computational resource</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Question Answering</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>LLaMA2-13b: &#60;60 s/item<sup>a</sup></p>
                    </list-item>
                    <list-item>
                      <p>GPT4: &#60;15 s/item</p>
                    </list-item>
                  </list>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>LLaMA2-13b: 4 * NVIDIA A100 GPU</p>
                    </list-item>
                    <list-item>
                      <p>GPT4: OpenAI API<sup>b</sup></p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>Text Summarization</td>
                <td>&#60;2 s/item</td>
                <td>1 * NVIDIA V100 GPU</td>
              </tr>
              <tr valign="top">
                <td>Text Simplification</td>
                <td>&#60;2 s/item</td>
                <td>1 * NVIDIA V100 GPU</td>
              </tr>
              <tr valign="top">
                <td>Machine translation</td>
                <td>&#60;2 s/item</td>
                <td>1 * NVIDIA V100 GPU</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table7fn1">
              <p><sup>a</sup>s/item: seconds per item.</p>
            </fn>
            <fn id="table7fn2">
              <p><sup>b</sup>API: application programming interface.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Clinicians’ Use of Ascle</title>
        <p>To evaluate the ease of usability of Ascle for clinicians, we report the time required for 2 clinicians with different backgrounds to use the package after receiving guidance. The backgrounds of the clinicians are as follows: (1) physician 1: Singapore General Hospital, senior resident, 7 years of working experience, has a basic level of programming knowledge, and is able to perform basic statistical analyses; and (2) physician 2: SengKang General Hospital, senior consultant, 15 years of working experience, and has no programming knowledge.</p>
        <p>Both clinicians received guidance on using Ascle, including setting up a virtual environment and accessing models from Hugging Face. The entire guidance process took about 10 minutes, after which both clinicians could independently and easily use Ascle and experiment with various generative functions without any issues. The main difficulty for the clinicians was setting up the virtual environment, as they lacked AI-specific knowledge. In response, Ascle provided a very simple virtual environment setup guideline. The clinicians’ experience further confirms the user-friendliness of Ascle.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>In the case of generation tasks, we primarily chose automatic metrics for evaluation, such as ROUGE and BLEU scores. However, these metrics cannot effectively assess factual correctness [<xref ref-type="bibr" rid="ref55">55</xref>] and may not align with human preference [<xref ref-type="bibr" rid="ref56">56</xref>]. While human evaluation serves as an invaluable aspect in assessing the performance of the model, its incorporation may pose certain challenges due to various factors, including budget constraints.</p>
      </sec>
      <sec>
        <title>Future Work</title>
        <p>Recent LLMs have shown great potential in generative applications especially its superior zero- and few-shot performance [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]. Despite this, the generated content can be unfaithful, inconsistent, and biased [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>]. We plan to thoroughly evaluate LLMs and extend to Ascle in the future. Meanwhile, we will strengthen the ethical review of these generative AI techniques to ensure their application truly and responsibly benefits biomedical researchers and health care professionals [<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref62">62</xref>].</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We introduce Ascle, a comprehensive NLP toolkit designed specifically for medical text generation. For the first time, it integrates 4 challenging generative functions, including question-answering, text summarization, text simplification, and machine translation. Our research fills the gap of existing toolkits for generative tasks, which holds significant implications for the entire medical domain. Ascle boasts remarkable flexibility, allowing users to access a variety of cutting-edge pretrained language models. Meanwhile, it stands as a user-friendly toolkit, ensuring ease of use even for clinical staff without a technical background. We will continue to maintain and extend Ascle.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>32 Fine-tuned language models and 27 benchmarks in Ascle.</p>
        <media xlink:href="jmir_v26i1e60601_app1.docx" xlink:title="DOCX File , 20 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Basic natural language processing functions in Ascle.</p>
        <media xlink:href="jmir_v26i1e60601_app2.docx" xlink:title="DOCX File , 192 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Query and search module in Ascle.</p>
        <media xlink:href="jmir_v26i1e60601_app3.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>The Retrieval-Augmented Generation framework in Ascle – KG-Rank.</p>
        <media xlink:href="jmir_v26i1e60601_app4.docx" xlink:title="DOCX File , 189 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Evaluation criteria for physician validation.</p>
        <media xlink:href="jmir_v26i1e60601_app5.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Case study.</p>
        <media xlink:href="jmir_v26i1e60601_app6.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BART</term>
          <def>
            <p>Bidirectional and Auto-Regressive Transformer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">FKGL</term>
          <def>
            <p>Flesch-Kincaid Grade Level</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RAG</term>
          <def>
            <p>Retrieval-Augmented Generation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">UMLS</term>
          <def>
            <p>Unified Medical Language System</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>TK and EC were supported by the National Institutes of Health (NIH) Intramural Research Program (IRP), National Eye Institute. ZL and QC were supported by the NIH IRP, National Library of Medicine. QC was also supported by the National Library of Medicine of the NIH (award 1K99LM014024). IL was supported by the Japan Society for the Promotion of Science (JSPS) KAKENHI (grant 24K20832). RY and IL received support from GCP Credit Award by Google.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>RY, QZ, KY, YQ, LH, CCH, BR, JG, YHK, and IL performed the data collection, data processing, and experiments. AD, TK conducted manual reviews. RY, QC, and IL created the figures and tables and drafted the manuscript. CH, NL, EC, DR, ZL, HX, QC, and IL were responsible for project administration. All authors conceived the idea for the article.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Yasunaga</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nuzumlalı</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Caraballo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mahajan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Krumholz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Radev</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A neural topic-attention model for medical term abbreviation disambiguation</article-title>
          <source>ArXiv. Preprint posted online on October 30, 2019</source>
          <year>2019</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1910.14076"/>
          </comment>
          <pub-id pub-id-type="doi">10.5260/chara.21.2.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Goldwasser</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>WP</given-names>
            </name>
            <name name-style="western">
              <surname>Nuzumlalı</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Rosand</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Krumholz</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Radev</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Neural natural language processing for unstructured data in electronic health records: a review</article-title>
          <source>Computer Science Review</source>
          <year>2022</year>
          <volume>46</volume>
          <fpage>100511</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cosrev.2022.100511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shickel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tighe</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bihorac</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidi</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Deep EHR: a survey of recent advances in deep learning techniques for electronic health record (EHR) analysis</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2018</year>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>1589</fpage>
          <lpage>1604</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29989977"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/JBHI.2017.2767063</pub-id>
          <pub-id pub-id-type="medline">29989977</pub-id>
          <pub-id pub-id-type="pmcid">PMC6043423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>al-Aiad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Duwairi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fraihat</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Survey: deep learning concepts and techniques for electronic health record</article-title>
          <year>2018</year>
          <conf-name>IEEE/ACS 15th International Conference on Computer Systems and Applications (AICCSA)</conf-name>
          <conf-date>2018 October 28 - 2018 November 01</conf-date>
          <conf-loc>Aqaba, Jordan</conf-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1109/aiccsa.2018.8612827</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>BioWordVec, improving biomedical word embeddings with subword information and MeSH</article-title>
          <source>Sci Data</source>
          <year>2019</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>52</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31076572"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-019-0055-0</pub-id>
          <pub-id pub-id-type="medline">31076572</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-019-0055-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6510737</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>BioSentVec: creating sentence embeddings for biomedical texts</article-title>
          <year>2019</year>
          <conf-name>IEEE International Conference on Healthcare Informatics (ICHI)</conf-name>
          <conf-date>June 10-13, 2019</conf-date>
          <conf-loc>Xi'an, China</conf-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1109/ichi.2019.8904728</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>ArXiv. Preprint posted online on May 24, 2019</source>
          <year>2019</year>
          <fpage>1</fpage>
          <lpage>16</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1810.04805"/>
          </comment>
          <pub-id pub-id-type="doi">10.5260/chara.21.2.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>1240</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alsentzer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Boag</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McDermott</surname>
              <given-names>MBA</given-names>
            </name>
          </person-group>
          <article-title>Publicly available clinical BERT embeddings</article-title>
          <source>Association for Computational Linguistics</source>
          <year>2019</year>
          <conf-name>the 2nd Clinical Natural Language Processing Workshop</conf-name>
          <conf-date>June 2019</conf-date>
          <conf-loc>Minneapolis, Minnesota, USA</conf-loc>
          <fpage>72</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w19-1909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tinn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lucas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Usuyama</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Poon</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Domain-specific language model pretraining for biomedical natural language processing</article-title>
          <source>ACM Trans. Comput. Healthcare</source>
          <year>2021</year>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1145/3458754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gottweis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sayres</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wulczyn</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pfohl</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cole-Lewis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Neal</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schaekermann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Amin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lachgar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mansfield</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Prakash</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dominowska</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Arcas</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Tomasev</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Semturs</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mahdavi</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Barral</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Matias</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Azizi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karthikesalingam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Towards expert-level medical question answering with large language models</article-title>
          <source>ArXiv. Preprint posted online on May 16, 2023</source>
          <year>2023</year>
          <pub-id pub-id-type="doi">10.48550/arXiv.2305.09617</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saab</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Tanno</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stutz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wulczyn</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Strother</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vedadi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chaves</surname>
              <given-names>JZ</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Schaekermann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kamath</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>DGT</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mustafa</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Palepu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McDuff</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Golany</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Alayrac</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Houlsby</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tomasev</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Freyberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kemp</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Azizi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kanada</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Man</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kulkarni</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shakeri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Caine</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Webson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Latysheva</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mansfield</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rivlin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Krause</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shlens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dominowska</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Eslami</surname>
              <given-names>EMA</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vinyals</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Kavukcuoglu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Manyika</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hassabis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Matias</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Barral</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Semturs</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mahdavi</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Gottweis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Karthikesalingam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Capabilities of gemini models in medicine</article-title>
          <source>ArXiv. Preprint posted online on May 1, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/arXiv.2404.18416</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Thirunavukarasu</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSW</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Large language models in health care: development, applications, and challenges</article-title>
          <source>Health Care Sci</source>
          <year>2023</year>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>255</fpage>
          <lpage>263</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38939520"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/hcs2.61</pub-id>
          <pub-id pub-id-type="medline">38939520</pub-id>
          <pub-id pub-id-type="pii">HCS261</pub-id>
          <pub-id pub-id-type="pmcid">PMC11080827</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mowery</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Vurgun</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Donnelly</surname>
              <given-names>HK</given-names>
            </name>
            <name name-style="western">
              <surname>Bandhey</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Akhtar</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Senathirajah</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sadhu</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Getzen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Freda</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Becich</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Realizing the potential of social determinants data: a scoping review of approaches for screening, linkage, extraction, analysis and interventions</article-title>
          <source>medRxiv. Preprint posted online on February 6, 2024</source>
          <year>2024</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38370703"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2024.02.04.24302242</pub-id>
          <pub-id pub-id-type="medline">38370703</pub-id>
          <pub-id pub-id-type="pii">2024.02.04.24302242</pub-id>
          <pub-id pub-id-type="pmcid">PMC10871446</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Keppo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bitterman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Retrieval-augmented generation for generative artificial intelligence in medicine</article-title>
          <source>ArXiv. Preprint posted online on June 18, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2406.12449</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McDermott</surname>
              <given-names>MBA</given-names>
            </name>
            <name name-style="western">
              <surname>Chauhan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-Extract</article-title>
          <year>2020</year>
          <conf-name>CHIL '20: Proceedings of the ACM Conference on Health, Inference, and Learning</conf-name>
          <conf-date>April 2-4, 2020</conf-date>
          <conf-loc>New York, USA</conf-loc>
          <publisher-loc>USA</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>222</fpage>
          <lpage>235</lpage>
          <pub-id pub-id-type="doi">10.1145/3368555.3384469</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Beltagy</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ammar</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>ScispaCy: Fast and robust models for biomedical natural language processing</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 18th BioNLP Workshop and Shared Task Stroudsburg</conf-name>
          <conf-date>August 1, 2019</conf-date>
          <conf-loc>Florence, Italy</conf-loc>
          <publisher-loc>USA</publisher-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>319</fpage>
          <lpage>327</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w19-5034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eyre</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Alba</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Box</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>DuVall</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
          </person-group>
          <article-title>Launching into clinical space with medspaCy: a new clinical text processing toolkit in Python</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2022</year>
          <volume>2021</volume>
          <fpage>438</fpage>
          <lpage>447</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35308962"/>
          </comment>
          <pub-id pub-id-type="medline">35308962</pub-id>
          <pub-id pub-id-type="pii">3576697</pub-id>
          <pub-id pub-id-type="pmcid">PMC8861690</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Transformers-sklearn: a toolkit for medical language understanding with transformer-based models</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2021</year>
          <volume>21</volume>
          <issue>Suppl 2</issue>
          <fpage>90</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-021-01459-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-021-01459-0</pub-id>
          <pub-id pub-id-type="medline">34330244</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-021-01459-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC8323195</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Langlotz</surname>
              <given-names>CP</given-names>
            </name>
          </person-group>
          <article-title>Biomedical and clinical English model packages for the stanza python NLP library</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>9</issue>
          <fpage>1892</fpage>
          <lpage>1899</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/34157094"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocab090</pub-id>
          <pub-id pub-id-type="medline">34157094</pub-id>
          <pub-id pub-id-type="pii">6307885</pub-id>
          <pub-id pub-id-type="pmcid">PMC8363782</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Marrese-Taylor</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Caverlee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Matsuo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>KG-Rank: Enhancing large language models for medical QA with knowledge graphs and ranking techniques</article-title>
          <source>ArXiv. Preprint posted online on July 04, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2403.05881</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>The unified medical language system (UMLS): integrating biomedical terminology</article-title>
          <source>Nucleic Acids Res</source>
          <year>2004</year>
          <volume>32</volume>
          <issue>Database issue</issue>
          <fpage>D267</fpage>
          <lpage>D270</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://nar.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=14681409"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkh061</pub-id>
          <pub-id pub-id-type="medline">14681409</pub-id>
          <pub-id pub-id-type="pii">32/suppl_1/D267</pub-id>
          <pub-id pub-id-type="pmcid">PMC308795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>McAuley</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Baize: an open-source chat model with parameter-efficient tuning on self-chat data</article-title>
          <year>2023</year>
          <conf-name>Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>December 2023</conf-date>
          <conf-loc>Singapore</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>6268</fpage>
          <lpage>6278</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2023.emnlp-main.385</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>OpenAI</collab>
            <name name-style="western">
              <surname>Achiam</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Adler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Akkaya</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Aleman</surname>
              <given-names>FL</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Altenschmidt</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Anadkat</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Avila</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Babuschkin</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Balaji</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Balcom</surname>
              <given-names>V et al</given-names>
            </name>
          </person-group>
          <article-title>GPT-4 Technical Report</article-title>
          <source>ArXiv. Preprint posted online on March 04, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2303.08774</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Touvron</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Albert</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Almahairi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Babaei</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bashlykov</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Batra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bhargava</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bhosale</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bikel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Blecher</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cucurull</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Esiobu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandes</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Fuller</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Goswami</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hartshorn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hosseini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Inan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kardas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kerkez</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Khabsa</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kloumann</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Korenev</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Koura</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lachaux</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lavril</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liskovich</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Martinet</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Mihaylov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Molybog</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nie</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Poulton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Reizenstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rungta</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Saladi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Schelten</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Subramanian</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kuan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zarov</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kambadur</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Narang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stojnic</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Edunov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Scialom</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Llama 2: open foundation and fine-tuned chat models</article-title>
          <source>ArXiv. Preprint posted online on July 19, 2023</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2307.09288</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abacha</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Agichtein</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Pinter</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Overview of the medical question answering task at TREC 2017 LiveQA</article-title>
          <year>2018</year>
          <conf-name>Text REtrieval Conference (TREC)</conf-name>
          <conf-date>May 2017</conf-date>
          <conf-loc>Gaithersburg, MD, USA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://trec.nist.gov/pubs/trec26/papers/Overview-QA.pdf?ref=https://githubhelp.com"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Malaviya</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sieber</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yatskar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>ExpertQA: expert-curated questions and attributed answers</article-title>
          <source>ArXiv. Preprint posted online on April 02, 2024</source>
          <year>2024</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/2309.07852"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2309.07852</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abacha</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Mrabet</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sharp</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Shooshan</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Bridging the gap between consumers' medication questions and trusted answers</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <volume>264</volume>
          <fpage>25</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI190176</pub-id>
          <pub-id pub-id-type="medline">31437878</pub-id>
          <pub-id pub-id-type="pii">SHTI190176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fiszman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weir</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Jonnalagadda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mostafa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Text summarization in the biomedical domain: a systematic review of recent research</article-title>
          <source>J Biomed Inform</source>
          <year>2014</year>
          <volume>52</volume>
          <fpage>457</fpage>
          <lpage>467</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00147-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2014.06.009</pub-id>
          <pub-id pub-id-type="medline">25016293</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(14)00147-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC4261035</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Comparing open-access database and traditional intensive care studies using machine learning: bibliometric analysis study</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <volume>26</volume>
          <fpage>e48330</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024//e48330/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48330</pub-id>
          <pub-id pub-id-type="medline">38630522</pub-id>
          <pub-id pub-id-type="pii">v26i1e48330</pub-id>
          <pub-id pub-id-type="pmcid">PMC11063894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ananiadou</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A survey for biomedical text summarization: from pre-trained to large language models</article-title>
          <source>ArXiv. Preprint posted online on July 13, 2023</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2304.08763</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Saleh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>PEGASUS: pre-training with extracted gap-sentences for abstractive summarization</article-title>
          <source>ArXiv. Preprint posted online on July 10, 2020</source>
          <year>2020</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.1912.08777</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zaheer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Guruganesh</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dubey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ainslie</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Alberti</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ontanon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pham</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ravula</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Big bird: transformers for longer sequences</article-title>
          <source>ArXiv. Preprint posted online on January 08, 2021</source>
          <year>2021</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2007.14062</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ghazvininejad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mohamed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Stoyanov</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Zettlemoyer</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>BART: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension</article-title>
          <year>2020</year>
          <conf-name>Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>July 2020</conf-date>
          <conf-loc>Online</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>7871</fpage>
          <lpage>7880</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.acl-main.703</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Beltagy</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Carenini</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cohan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>PRIMERA: pyramid-based masked sentence pre-training for multi-document summarization</article-title>
          <year>2022</year>
          <conf-name>Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics</conf-name>
          <conf-date>May 2022</conf-date>
          <conf-loc>Dublin, Ireland</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <pub-id pub-id-type="doi">10.18653/v1/2022.acl-long.360</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Phan</surname>
              <given-names>LN</given-names>
            </name>
            <name name-style="western">
              <surname>Anibal</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chanana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bahadroglu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Peltekian</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Altan-Bonnet</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>SciFive: a text-to-text transformer model for biomedical literature</article-title>
          <source>ArXiv. Preprint posted online on May 28, 2021</source>
          <year>2021</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2106.03598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>BioBART: pretraining and evaluation of a biomedical generative language model</article-title>
          <year>2022</year>
          <conf-name>Proceedings of the 21st Workshop on Biomedical Language Processing</conf-name>
          <conf-date>May 2022</conf-date>
          <conf-loc>Dublin, Ireland</conf-loc>
          <publisher-loc>BioBART</publisher-loc>
          <publisher-name>Pretraining and evaluation of A biomedical generative language model. arXiv</publisher-name>
          <fpage>97</fpage>
          <lpage>109</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2022.bionlp-1.9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dernoncourt</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bui</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Goharian</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>A discourse-aware attention model for abstractive summarization of long documents</article-title>
          <year>2018</year>
          <conf-name>Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name>
          <conf-date>June 2018</conf-date>
          <conf-loc>New Orleans, Louisiana</conf-loc>
          <fpage>615</fpage>
          <lpage>621</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/n18-2097</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AEW</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Berkowitz</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Greenbaum</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Lungren</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Horng</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-CXR, a de-identified publicly available database of chest radiographs with free-text reports</article-title>
          <source>Sci Data</source>
          <year>2019</year>
          <day>1</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>317</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-019-0322-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-019-0322-0</pub-id>
          <pub-id pub-id-type="medline">31831740</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-019-0322-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6908718</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Savery</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abacha</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Gayen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Question-driven summarization of answers to consumer health questions</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>322</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-020-00667-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00667-z</pub-id>
          <pub-id pub-id-type="medline">33009402</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-020-00667-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC7532186</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devaraj</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Paragraph-level Simplification of medical texts</article-title>
          <source>Proc Conf</source>
          <year>2021</year>
          <volume>2021</volume>
          <fpage>4972</fpage>
          <lpage>4984</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35663507"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2021.naacl-main.395</pub-id>
          <pub-id pub-id-type="medline">35663507</pub-id>
          <pub-id pub-id-type="pmcid">PMC9161242</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goldsack</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scarton</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Making science simple: corpora for the lay summarisation of scientific literature</article-title>
          <year>2022</year>
          <conf-name>Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>December 2022</conf-date>
          <conf-loc>Abu Dhabi, United Arab Emirates</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>10589</fpage>
          <lpage>10604</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2022.emnlp-main.724</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Benchmarking automated clinical language simplification: dataset, algorithm, and evaluation</article-title>
          <source>ArXiv. Preprint posted online on September 21, 2023</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2012.02420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khoong</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>A research agenda for using machine translation in clinical medicine</article-title>
          <source>J Gen Intern Med</source>
          <year>2022</year>
          <volume>37</volume>
          <issue>5</issue>
          <fpage>1275</fpage>
          <lpage>1277</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35132559"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-021-07164-y</pub-id>
          <pub-id pub-id-type="medline">35132559</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11606-021-07164-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC8971300</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Junczys-Dowmunt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Grundkiewicz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dwojak</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hoang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Heafield</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Neckermann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Seide</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Germann</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Aji</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bogoychev</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Martins</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Birch</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Marian: fast neural machine translation in C++</article-title>
          <year>2018</year>
          <conf-name>Proceedings of ACL 2018, System Demonstrations</conf-name>
          <conf-date>July 2018</conf-date>
          <conf-loc>Melbourne, Australia</conf-loc>
          <publisher-loc>Association for Computational Linguistics</publisher-loc>
          <fpage>116</fpage>
          <lpage>121</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/p18-4020</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Constant</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kale</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Rfou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Siddhant</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barua</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Raffel</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>mT5: A massively multilingual pre-trained text-to-text transformer</article-title>
          <year>2021</year>
          <conf-name>Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</conf-name>
          <conf-date>June 2021</conf-date>
          <conf-loc>Online</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>483</fpage>
          <lpage>498</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2021.naacl-main.41</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="web">
          <source>UFAL Medical Corpus v. 1.0</source>
          <access-date>2024-08-06</access-date>
          <publisher-name>UFAL MediCorp</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ufal.mff.cuni.cz/ufal_medical_corpus">https://ufal.mff.cuni.cz/ufal_medical_corpus</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>CY</given-names>
            </name>
          </person-group>
          <article-title>ROUGE: a package for automatic evaluation of summaries</article-title>
          <year>2004</year>
          <conf-name>Text Summarization Branches Out</conf-name>
          <conf-date>July 2004</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>74</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/W04-1013.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kishore</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Weinberger</surname>
              <given-names>KQ</given-names>
            </name>
            <name name-style="western">
              <surname>Artzi</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>BERTScore: evaluating text generation with BERT</article-title>
          <source>ArXiv. Preprint posted online on February 24, 2020</source>
          <year>2020</year>
          <pub-id pub-id-type="doi">10.5260/chara.21.2.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Peyrard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Eger</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>MoverScore: text generation evaluating with contextualized embeddings and earth mover distance</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)</conf-name>
          <conf-date>November 2019</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>563</fpage>
          <lpage>578</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/d19-1053</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sellam</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Parikh</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>BLEURT: learning robust metrics for text generation</article-title>
          <source>ArXiv. Preprint posted online on May 21, 2020</source>
          <year>2020</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2004.04696</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rohde</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Hierarchical learning for generation with long source sequences</article-title>
          <source>ArXiv. Preprint posted online on September 16, 2021</source>
          <year>2021</year>
          <pub-id pub-id-type="doi">10.5260/chara.21.2.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kincaid</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Fishburne</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Chissom</surname>
              <given-names>BS</given-names>
            </name>
          </person-group>
          <article-title>Derivation Of new readability formulas (Automated Readability Index, Fog Count And Flesch Reading Ease Formula) for navy enlisted personnel</article-title>
          <source>Institute for Simulation and Training</source>
          <year>1975</year>
          <volume>56</volume>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://stars.library.ucf.edu/istlibrary/56"/>
          </comment>
          <pub-id pub-id-type="doi">10.21236/ada006655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mihalcea</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tarau</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>TextRank: Bringing Order into Text</article-title>
          <year>2004</year>
          <conf-name>Proceedings of the Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>August 01, 2004</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>404</fpage>
          <lpage>411</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/W04-3252.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Schenck</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Faithful AI in medicine: a systematic review with large language models and beyond</article-title>
          <source>medRxiv. Preprint posted online on July 01, 2023</source>
          <year>2023</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37398329"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2023.04.18.23288752</pub-id>
          <pub-id pub-id-type="medline">37398329</pub-id>
          <pub-id pub-id-type="pii">2023.04.18.23288752</pub-id>
          <pub-id pub-id-type="pmcid">PMC10312867</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fleming</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Lozano</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haberkorn</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jindal</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reis</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Thapa</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Blankemeier</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Genkins</surname>
              <given-names>JZ</given-names>
            </name>
            <name name-style="western">
              <surname>Steinberg</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nayak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gatidis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fayanju</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Savage</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Goh</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhari</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Aghaeepour</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sharp</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeffer</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Morse</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Brunskill</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Fries</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>MedAlign: a clinician-generated dataset for instruction following with electronic medical records</article-title>
          <year>2024</year>
          <conf-name>Proceedings of the 38th AAAI Conference on Artificial Intelligence</conf-name>
          <conf-date>February 20-27, 2024</conf-date>
          <conf-loc>Vancouver, Canada</conf-loc>
          <fpage>22021</fpage>
          <lpage>22030</lpage>
          <pub-id pub-id-type="doi">10.1609/aaai.v38i20.30205</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>She</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Large Language models on wikipedia-style survey generation: an evaluation in NLP concepts</article-title>
          <source>ArXiv. Preprint posted online on May 23, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2308.10410</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ouyang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>She</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lecue</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Leveraging large language models for concept graph recovery and question answering in NLP education</article-title>
          <source>ArXiv. Preprint posted online on February 22, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2402.14293</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lie</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>TXY</given-names>
            </name>
            <name name-style="western">
              <surname>Abdullah</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSW</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Enhancing diagnostic accuracy through multi-agent conversations: using large language models to mitigate cognitive bias</article-title>
          <source>ArXiv. Preprint posted online on May 12, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2401.14589</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yeganova</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Comeau</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Islamaj</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kapoor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Opportunities and challenges for ChatGPT and large language models in biomedicine and health</article-title>
          <source>Brief Bioinform</source>
          <year>2023</year>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>bbad493</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38168838"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bib/bbad493</pub-id>
          <pub-id pub-id-type="medline">38168838</pub-id>
          <pub-id pub-id-type="pii">7505071</pub-id>
          <pub-id pub-id-type="pmcid">PMC10762511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Teixayavong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Savulescu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nagaraj</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Miao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mertens</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSW</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>JCL</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vaughan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>MEH</given-names>
            </name>
            <name name-style="western">
              <surname>Sung</surname>
              <given-names>JJY</given-names>
            </name>
            <name name-style="western">
              <surname>Topol</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Generative artificial intelligence in healthcare: ethical considerations and assessment checklist</article-title>
          <source>ArXiv. Preprint posted online on February 23, 2024</source>
          <year>2024</year>
          <pub-id pub-id-type="doi">10.48550/ARXIV.2311.02107</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nair</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>D’Agostino</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Disparities in clinical studies of AI-enabled applications from a global perspective</article-title>
          <source>NPJ Digit Med</source>
          <year>2024</year>
          <volume>7</volume>
          <fpage>209</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-024-01212-7"/>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
