<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="review-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e64486</article-id>
      <article-id pub-id-type="pmid">40305085</article-id>
      <article-id pub-id-type="doi">10.2196/64486</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Accuracy of Large Language Models When Answering Clinical Research Questions: Systematic Review and Network Meta-Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Ma</surname>
            <given-names>Xiaomeng</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lotfinia</surname>
            <given-names>Mahshad</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Xiao-Meng</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Ling</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1970-0862</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Jinglin</given-names>
          </name>
          <degrees>BD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0004-4680-1548</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhuang</surname>
            <given-names>Boyang</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-2162-7076</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Shasha</given-names>
          </name>
          <degrees>BD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-3554-5828</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Fang</surname>
            <given-names>Meilin</given-names>
          </name>
          <degrees>BD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-3499-9168</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Cunze</given-names>
          </name>
          <degrees>BD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7751-1242</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Wen</given-names>
          </name>
          <degrees>BD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-0542-7489</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Mohan</given-names>
          </name>
          <degrees>BD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-1786-0176</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Gong</surname>
            <given-names>Shurong</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <address>
            <institution>The Third Department of Critical Care Medicine</institution>
            <institution>Fuzhou University Affiliated Provincial Hospital</institution>
            <institution>Shengli Clinical Medical College, Fujian Medical University</institution>
            <addr-line>No.134 Dongjie Road</addr-line>
            <addr-line>Fuzhou, Fujian, 350001</addr-line>
            <country>China</country>
            <phone>86 15060677447</phone>
            <email>shurong_gong@fjmu.edu.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1746-8198</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Fuzhou University Affiliated Provincial Hospital</institution>
        <institution>Shengli Clinical Medical College</institution>
        <institution>Fujian Medical University</institution>
        <addr-line>Fuzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>School of Pharmacy</institution>
        <institution>Fujian Medical University</institution>
        <addr-line>Fuzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Fujian Center For Drug Evaluation and Monitoring</institution>
        <addr-line>Fuzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>School of Pharmacy</institution>
        <institution>Fujian University of Traditional Chinese Medicine</institution>
        <addr-line>Fuzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>The Third Department of Critical Care Medicine</institution>
        <institution>Fuzhou University Affiliated Provincial Hospital</institution>
        <institution>Shengli Clinical Medical College, Fujian Medical University</institution>
        <addr-line>Fuzhou, Fujian</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Shurong Gong <email>shurong_gong@fjmu.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>4</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e64486</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>14</day>
          <month>10</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>4</day>
          <month>2</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>3</day>
          <month>4</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Ling Wang, Jinglin Li, Boyang Zhuang, Shasha Huang, Meilin Fang, Cunze Wang, Wen Li, Mohan Zhang, Shurong Gong. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 30.04.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e64486" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Large language models (LLMs) have flourished and gradually become an important research and application direction in the medical field. However, due to the high degree of specialization, complexity, and specificity of medicine, which results in extremely high accuracy requirements, controversy remains about whether LLMs can be used in the medical field. More studies have evaluated the performance of various types of LLMs in medicine, but the conclusions are inconsistent.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study uses a network meta-analysis (NMA) to assess the accuracy of LLMs when answering clinical research questions to provide high-level evidence for their future development and application in the medical field.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>In this systematic review and NMA, we searched PubMed, Embase, Web of Science, and Scopus from inception until October 14, 2024. Studies on the accuracy of LLMs when answering clinical research questions were included and screened by reading published reports. The systematic review and NMA were conducted to compare the accuracy of different LLMs when answering clinical research questions, including objective questions, open-ended questions, top 1 diagnosis, top 3 diagnosis, top 5 diagnosis, and triage and classification. The NMA was performed using Bayesian frequency theory methods. Indirect intercomparisons between programs were performed using a grading scale. A larger surface under the cumulative ranking curve (SUCRA) value indicates a higher ranking of the corresponding LLM accuracy.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The systematic review and NMA examined 168 articles encompassing 35,896 questions and 3063 clinical cases. Of the 168 studies, 40 (23.8%) were considered to have a low risk of bias, 128 (76.2%) had a moderate risk, and none were rated as having a high risk. ChatGPT-4o (SUCRA=0.9207) demonstrated strong performance in terms of accuracy for objective questions, followed by Aeyeconsult (SUCRA=0.9187) and ChatGPT-4 (SUCRA=0.8087). ChatGPT-4 (SUCRA=0.8708) excelled at answering open-ended questions. In terms of accuracy for top 1 diagnosis and top 3 diagnosis of clinical cases, human experts (SUCRA=0.9001 and SUCRA=0.7126, respectively) ranked the highest, while Claude 3 Opus (SUCRA=0.9672) performed well at the top 5 diagnosis. Gemini (SUCRA=0.9649) had the highest rated SUCRA value for accuracy in the area of triage and classification.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study indicates that ChatGPT-4o has an advantage when answering objective questions. For open-ended questions, ChatGPT-4 may be more credible. Humans are more accurate at the top 1 diagnosis and top 3 diagnosis. Claude 3 Opus performs better at the top 5 diagnosis, while for triage and classification, Gemini is more advantageous. This analysis offers valuable insights for clinicians and medical practitioners, empowering them to effectively leverage LLMs for improved decision-making in learning, diagnosis, and management of various clinical scenarios.</p>
        </sec>
        <sec sec-type="trial registration">
          <title>Trial Registration</title>
          <p>PROSPERO CRD42024558245; https://www.crd.york.ac.uk/PROSPERO/view/CRD42024558245</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>large language models</kwd>
        <kwd>LLM</kwd>
        <kwd>clinical research questions</kwd>
        <kwd>accuracy</kwd>
        <kwd>network meta-analysis</kwd>
        <kwd>PRISMA</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Recent research has demonstrated the considerable success of large language models (LLMs) in a multitude of natural language tasks, including automatic summarization (the generation of a condensed version of a passage of text), machine translation (the automatic translation of text from one language to another), and question-and-answer systems (the construction of a system to automatically answer questions based on a passage of text) [<xref ref-type="bibr" rid="ref1">1</xref>]. In this context, with the development of big biomedical data and artificial intelligence, the emergence of flexible natural language processing models such as ChatGPT provides a number of new possibilities for health care and biomedical research and has the potential to be a turning point in the field [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>Although LLMs have shown great potential in the medical field, medicine is a demanding field that directly concerns human life, and its complexity and specificity mean that any application must meet extremely high standards of accuracy. Controversy remains about whether LLMs can be applied to the medical field. Mu and He [<xref ref-type="bibr" rid="ref5">5</xref>] reviewed the potential applications and challenges of ChatGPT in health care, noting that a lack of understanding of medical knowledge and specialized medical backgrounds hinders the ability of ChatGPT to delve into the complexity of medical concepts and terminology. Consequently, the capacity of ChatGPT to address specific medical queries, diagnose ailments, or furnish precise medical recommendations is restricted. Another study noted that the role of LLMs in health care may be limited by the presence of bias in training materials, their tendency to “hallucinate,” and ethical and legal considerations when LLMs provide inaccurate advice that leads to patient harm, as well as patient privacy issues [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>Given the controversy over the application of LLMs in medicine and the continuous emergence and versioning of LLMs, more research has been devoted to evaluating the performance of various LLMs in medicine to provide stronger evidence. In addition to ChatGPT developed by OpenAI, the performance of many other LLMs, such as those from Microsoft (eg, Copilot [<xref ref-type="bibr" rid="ref7">7</xref>]), Google (eg, Gemini [<xref ref-type="bibr" rid="ref8">8</xref>]), and Meta (eg, LLaMA [<xref ref-type="bibr" rid="ref9">9</xref>]), in the medical domain has also been compared. Many aspects of assessment have been included, such as medical exams [<xref ref-type="bibr" rid="ref10">10</xref>], case text diagnosis [<xref ref-type="bibr" rid="ref11">11</xref>], and disease classification or grading [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>Unfortunately, there are differences in the performance of different LLMs in different studies. For example, in a study by Vaishya et al [<xref ref-type="bibr" rid="ref13">13</xref>] that explored the performance of ChatGPT-3.5, ChatGPT-4, and Google Bard when answering 120 multiple-choice questions, the results showed that Google Bard had 100% accuracy and was significantly more accurate than both ChatGPT-3.5 and ChatGPT-4 (<italic>P</italic>&lt;.001). Another study showed that ChatGPT-4 was more accurate than Google Bard (83% vs 76%) [<xref ref-type="bibr" rid="ref14">14</xref>]. At present, most related research is limited to a single type of LLM [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>] or a specific domain area [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>], and there is no high-level evidence comparing the accuracy rankings of different LLMs when responding to clinical research questions.</p>
      <p>Therefore, this study aimed to compare the accuracy of different LLMs when answering clinical research questions, including objective questions, open-ended questions, top 1 diagnosis, top 3 diagnosis, top 5 diagnosis, and triage and classification. This study aimed to provide high-level evidence-based support for future clinical applications, enabling clinical workers to better use LLMs to make more accurate and informed decisions for future learning, diagnosis, and different clinical scenarios.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Network Meta-Analysis</title>
        <p>The network meta-analysis (NMA) was based on the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) reporting guidelines. The PRISMA checklist is shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The Bayesian approach permits the indirect comparison of performance between a range of LLMs that were not explicitly articulated throughout the experiment. The study protocol was defined and registered in the PROSPERO database prior to the commencement of the study.</p>
      </sec>
      <sec>
        <title>Search Strategy and Selection Criteria</title>
        <p>A computer search of the PubMed, Embase, Web of Science, and Scopus databases was conducted to identify relevant studies on the accuracy of different LLMs when answering questions in the medical field. The last search was updated to October 14, 2024, to identify studies published since the first search, with no restrictions on the type of study. When the results of a study were reported in multiple publications, we included the study with the richest and most recent findings. We also searched the list of literature on LLMs in medicine-related systematic reviews and manually searched the references included in the reviews for additional access to relevant literature. The search subject terms were “LLM,” “generative AI,” “open AI,” “Large language model,” “ChatGPT-3.5,” “ChatGPT-4,” “Google Bard,” and “Bing,” without any language restriction. The complete search strategies for all databases are shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        <p>A combination of EndNote X9 deduplication and manual deduplication was used to screen the literature in accordance with the developed inclusion criteria. The results of the literature searches conducted in different databases were then combined to create a new information database, which could be downloaded in full text. Independent review and assessment of the titles, abstracts, and full texts of the relevant literature were undertaken by 4 authors (LW, JL, BZ, and SH). The review encompassed studies using disparate LLM systems to respond to medical queries. Letters, conference abstracts, editorials, reviews, and expert opinions for which no information was available were excluded from the review. In addition, the following studies were excluded: those that evaluated the performance of only 1 LLM; those that assessed the performance of 2 or more LLMs without specifying the LLM versions used (eg, the article only mentioned evaluating ChatGPT without mentioning ChatGPT-3.5, ChatGPT-4, or other versions), with the updated versions and timelines of various LLMs so far shown in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>; those that assessed the performance of 2 or more LLMs but did not provide data isolating their accuracy when answering different types of questions; and those in which the questions included in the study contained images. In addition, to reduce bias, we excluded research on accessing LLMs through an application programming interface (API).</p>
      </sec>
      <sec>
        <title>Assessment of Results</title>
        <p>The primary outcomes were the accuracy of LLMs when answering medical questions. These included objective questions, open-ended questions, top 1 diagnosis, top 3 diagnosis, top 5 diagnosis, and triage and classification accuracy. Objective questions are exam questions with a clear, quantifiable answer that is usually predetermined, unique, or with a limited number of options. Open-ended questions are questions that have neither a fixed nor a standardized answer. Diagnosis and triage and classification are open-ended questions, but most diagnostic questions end with “What is the most probable diagnosis?” whereas triage and classification questions end with “How would you classify this disease?” Corresponding examples are shown in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
        <p>Accuracy for objective questions was calculated as the number of correctly answered questions divided by the total number of questions. For diagnosis and classification, accuracy was defined as the number of cases correctly diagnosed or triaged divided by the total number of cases. Specifically for open-ended questions, accuracy was determined based on the number of questions rated “good” or “accurate” on the accuracy scale divided by the total number of questions.</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>The 4 researchers jointly extracted and verified the following data: (1) basic information about the included studies, such as study title and first author; (2) baseline characteristics and interventions of the study population; (3) key elements evaluated for risk of bias; and (4) outcome indicators and relevant outcome measure data. Our study involved extracting raw data from each study. Disagreements were resolved through discussion and consultation with a third party.</p>
      </sec>
      <sec>
        <title>Quality Assessment</title>
        <p>Because they were cross-sectional studies, the quality of the included studies was evaluated using the Newcastle-Ottawa Scale [<xref ref-type="bibr" rid="ref19">19</xref>]. The quality assessment was conducted by 3 independent researchers (LW, JL, and BZ), with a fourth researcher (SH) resolving any disagreements. A low overall risk of bias was determined when the Newcastle-Ottawa Scale score ranged from 7 to 9, moderate risk was determined when the score was between 4 and 6, and high risk was determined when the score was 0 to 3.</p>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <p>Statistical analyses were performed using Stata 18.0 and R (version 4.3.1), with the odds ratio (OR) as the analytical statistic. Accuracy was assessed using 95% CIs and the credible interval. NMA analyses were performed on different types of LLMs.</p>
        <p>Confidence in the NMA estimates was assessed according to the Confidence in Network Meta-Analysis (CINeMA) methodology, which is broadly based on the Grading of Recommendations Assessment, Development, and Evaluation (GRADE). An NMA was conducted within a Bayesian framework using Markov chain Monte Carlo methods and was computed using the BUGSnet and GeMTC packages in R (V.4.3.1) software. A network graph was constructed for each LLM included in the experiment in order to facilitate a comparison of the performance of multiple LLMs. The consistency between direct and indirect evidence was evaluated using a node-splitting method when there was a closed loop. If the <italic>P</italic> value between the direct, indirect, and network comparisons of the 2 interventions was &gt;.05, we concluded that there was no statistical difference and consistency was good. The convergence of the network models derived from the Markov chain Monte Carlo simulations was assessed using trace and density plots. We used noninformative priors for all parameters and assumed common heterogeneity. Furthermore, for all LLMs, we determined the ranking probabilities, which were articulated as the surface under the cumulative ranking curve (SUCRA). Higher SUCRA values suggest superior accuracy in model ranking.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Literature Search and Selection</title>
        <p>A bibliographic search yielded 59,075 citations, of which 21,156 studies were identified as potential candidates based on abstract screening and retrieved for full text evaluation. Manual reading of the titles and abstracts of the remaining literature excluded 20,814 papers whose topics and interventions did not match the inclusion criteria for this study. Further reading of the full texts excluded the following: 174 articles that could not be separated or extracted from the ending; 147 articles in which we were unable to separate outcome data, unable to extract outcome data, or detected issues related to images; 12 articles with unclear versions of the LLMs; and 8 articles that used an API to access LLMs. In addition, the full text of 7 articles was not available, resulting in the final inclusion of 168 articles from the literature. The literature screening process is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Literature screening flowchart. API: application programming interface.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e64486_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Basic Characteristics of the Incorporated Literature</title>
        <p>To assess the accuracy of different LLMs when answering medical questions, a total of 168 studies underwent a screening process to determine their suitability for inclusion. A total of 35,896 questions and 3063 clinical cases were included in the study. The basic information of the 168 studies is presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
      </sec>
      <sec>
        <title>Quality Assessment of the Included Studies</title>
        <p>In the quality assessment, 40 (40/168, 23.8%) studies were assessed as having a low overall risk of bias, while 128 (128/168, 76.2%) had a moderate overall risk of bias. No studies were identified as having a high overall risk of bias. The detailed quality assessment results for each study can be found in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>.</p>
      </sec>
      <sec>
        <title>Network Meta-Analysis</title>
        <sec>
          <title>Objective Questions</title>
          <p>The accuracy of LLMs when answering objective questions was reported in 105 studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref121">121</xref>]. The evidence network relationships are plotted in <xref rid="figure2" ref-type="fig">Figure 2</xref>A and involve 30 LLMs and a total of 33,838 multiple choice questions. Direct and indirect comparisons were formed for each LLM, partially forming a closed loop. The results of the indirect comparison are shown in <xref rid="figure3" ref-type="fig">Figure 3</xref> and <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>. The red cells indicate there are statistically significant differences between the column-defining regimen and the row-defining regimen. The values in the green and blue cells are the logOR and 95% CI, respectively, from the comparison of the LLMs represented in the columns with the LLMs represented in the rows. A logOR value &lt;0 indicates that the accuracy of the LLM corresponding to a column is lower than the LLM corresponding to a row. A value &gt;0 indicates a higher accuracy. There was no evidence of statistically significant inconsistency (all <italic>P</italic>&gt;.05) in the node-splitting test for NMA, except for Claude 2 versus ChatGPT-4 (<italic>P</italic>=.04), Bing chat versus people (<italic>P</italic>=.004), and Perplexity versus people (<italic>P</italic>=.04; <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>). The convergence of iterations was evaluated as good in trace and density plots, with the bandwidth tending toward 0 and reaching stability (<xref ref-type="supplementary-material" rid="app9">Multimedia Appendix 9</xref>). 
The best probability ranking showed that ChatGPT-4o (SUCRA=0.9207) ranked first in terms of accuracy when answering objective questions, Aeyeconsult (SUCRA=0.9187) ranked second, and ChatGPT-4 (SUCRA=0.8087) ranked third (<xref ref-type="table" rid="table1">Table 1</xref>, <xref rid="figure4" ref-type="fig">Figure 4</xref>A).</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Comparison network diagram of different outcomes, where larger nodes indicate more questions and thicker line segments indicate more questions between 2 types of large language models (LLMs) when answering (A) objective questions, (B) open-ended questions, (C) a top 1 diagnosis, (D) a top 3 diagnosis, (E) a top 5 diagnosis, and (F) triage and classification questions.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e64486_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Indirect comparison of the accuracy of large language models (LLMs) when answering objective questions: A: instructGPT; A1: LLaMA 2; B: GPT-3; B1: LLaMA 3; C: ChatGPT-3.5; D: ChatGPT-4; D1: Mistral Large; E: ChatGPT-4o; E1: people; F1: chatENT; G: Bard; G1: ChatSonic; H: PaLM2; H1: Aeyeconsult; I: Gemini; I1: Med-PaLM 2; K: Gemini 1.5 pro; L: Bing chat; M: Copilot; N: Perplexity; O: Perplexity Pro; P: Claude; Q: Claude-instant; R: Claude 2; T: Claude 3 Opus; U: Claude 3 Sonnet; W: LLaMA 7B; X: LLaMA 13B; Y: LLaMA 33B; Z: LLaMA 65B.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e64486_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Bayesian ranking results (surface under the cumulative ranking curve [SUCRA] value) of the network meta-analysis for each large language model (LLM).</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="150"/>
              <col width="150"/>
              <col width="160"/>
              <col width="120"/>
              <col width="120"/>
              <col width="120"/>
              <col width="180"/>
              <thead>
                <tr valign="top">
                  <td>LLM</td>
                  <td colspan="6">SUCRA</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Objective questions</td>
                  <td>Open-ended questions</td>
                  <td>Top 1 diagnosis</td>
                  <td>Top 3 diagnosis</td>
                  <td>Top 5 diagnosis</td>
                  <td>Triage and classification</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>instructGPT (A)</td>
                  <td>0.7805</td>
                  <td>—<sup>a</sup></td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>LLaMA 2 (A1)</td>
                  <td>0.2086</td>
                  <td>0.4629</td>
                  <td>0.1395</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>GPT-3 (B)</td>
                  <td>0.7704</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>LLaMA 3 (B1)</td>
                  <td>0.239</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>0.7405</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>ChatGPT-3.5 (C)</td>
                  <td>0.4343</td>
                  <td>0.5548</td>
                  <td>0.5039</td>
                  <td>0.565</td>
                  <td>0.5084</td>
                  <td>0.2093</td>
                </tr>
                <tr valign="top">
                  <td>Mixtral-8x7B (C1)</td>
                  <td>—</td>
                  <td>0.6224</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>ChatGPT-4 (D)</td>
                  <td>0.8087</td>
                  <td>0.8708</td>
                  <td>0.693</td>
                  <td>0.6302</td>
                  <td>0.8089</td>
                  <td>0.6185</td>
                </tr>
                <tr valign="top">
                  <td>Mistral Large (D1)</td>
                  <td>0.3842</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>ChatGPT-4o (E)</td>
                  <td>0.9207</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>People (E1)</td>
                  <td>0.6172</td>
                  <td>0.6067</td>
                  <td>0.9001</td>
                  <td>0.7126</td>
                  <td>0.6241</td>
                  <td>0.4934</td>
                </tr>
                <tr valign="top">
                  <td>chatENT (F1)</td>
                  <td>0.7687</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Bard (G)</td>
                  <td>0.4443</td>
                  <td>0.3512</td>
                  <td>0.3353</td>
                  <td>0.4329</td>
                  <td>0.0722</td>
                  <td>0.5885</td>
                </tr>
                <tr valign="top">
                  <td>ChatSonic (G1)</td>
                  <td>0.4617</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>PaLM2 (H)</td>
                  <td>0.421</td>
                  <td>0.312</td>
                  <td>0.4496</td>
                  <td>—</td>
                  <td>—</td>
                  <td>0.5197</td>
                </tr>
                <tr valign="top">
                  <td>Aeyeconsult (H1)</td>
                  <td>0.9187</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Gemini (I)</td>
                  <td>0.4543</td>
                  <td>0.6703</td>
                  <td>0.2812</td>
                  <td>—</td>
                  <td>0.2405</td>
                  <td>0.9649</td>
                </tr>
                <tr valign="top">
                  <td>Med-PaLM 2 (I1)</td>
                  <td>0.3919</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>OcularBERT (J1)</td>
                  <td>—</td>
                  <td>0.0176</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Gemini 1.5 pro (K)</td>
                  <td>0.2449</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>0.7905</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Doctor GPT (K1)</td>
                  <td>—</td>
                  <td>0.745</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Bing chat (L)</td>
                  <td>0.728</td>
                  <td>0.23</td>
                  <td>0.2073</td>
                  <td>0.4499</td>
                  <td>0.2042</td>
                  <td>0.3391</td>
                </tr>
                <tr valign="top">
                  <td>Docs-GPT Beta (L1)</td>
                  <td>—</td>
                  <td>0.212</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Copilot (M)</td>
                  <td>0.7038</td>
                  <td>—</td>
                  <td>0.5048</td>
                  <td>—</td>
                  <td>0.2633</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>WebMD (M1)</td>
                  <td>—</td>
                  <td>—</td>
                  <td>0.7511</td>
                  <td>0.1452</td>
                  <td>—</td>
                  <td>0.4348</td>
                </tr>
                <tr valign="top">
                  <td>Perplexity (N)</td>
                  <td>0.4424</td>
                  <td>—</td>
                  <td>0.3980</td>
                  <td>0.4367</td>
                  <td>0.2801</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Ada Health (N1)</td>
                  <td>—</td>
                  <td>—</td>
                  <td>0.8363</td>
                  <td>0.6273</td>
                  <td>—</td>
                  <td>0.3319</td>
                </tr>
                <tr valign="top">
                  <td>Perplexity Pro (O)</td>
                  <td>0.3821</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Claude (P)</td>
                  <td>0.5048</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Claude-instant (Q)</td>
                  <td>0.4949</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Claude 2 (R)</td>
                  <td>0.4928</td>
                  <td>0.5647</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Claude 3 Opus (T)</td>
                  <td>0.7365</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>0.9672</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>Claude 3 Sonnet (U)</td>
                  <td>0.5094</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>LLaMA 7B (W)</td>
                  <td>0.1131</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>LLaMA 13B (X)</td>
                  <td>0.1365</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>LLaMA 33B (Y)</td>
                  <td>0.2147</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>LLaMA 65B (Z)</td>
                  <td>0.2721</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>Not applicable because the LLM was not in the network.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Surface under the cumulative ranking curve (SUCRAs) for the accuracy, with higher rankings associated with larger outcome values, of different large language models (LLMs) when answering (A) objective questions, (B) open-ended questions, (C) the top 1 diagnosis, (D) the top 3 diagnosis, (E) the top 5 diagnosis, and (F) triage and classification questions. The letters in the keys indicate the following LLMs: A: instructGPT; A1: LLaMA 2; B: GPT-3; B1: LLaMA 3; C: ChatGPT-3.5; C1: Mixtral-8x7B; D: ChatGPT-4; D1: Mistral Large; E: ChatGPT-4o; E1: people; F1: chatENT; G: Bard; G1: ChatSonic; H: PaLM2; H1: Aeyeconsult; I: Gemini; I1: Med-PaLM 2; J1: OcularBERT; K: Gemini 1.5 pro; K1: Doctor GPT; L: Bing chat; L1: Docs-GPT Beta; M: Copilot; M1: WebMD; N: Perplexity; N1: Ada Health; O: Perplexity Pro; P: Claude; Q: Claude-instant; R: Claude 2; S: Claude 2.1; T: Claude 3 Opus; U: Claude 3 Sonnet; W: LLaMA 7B; X: LLaMA 13B; Y: LLaMA 33B; Z: LLaMA 65B.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e64486_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Subgroup Analysis</title>
          <p>We stratified the results based on the fields of the problem (<xref ref-type="supplementary-material" rid="app10">Multimedia Appendix 10</xref>). Based on the results, we compared the accuracy of LLMs in 6 fields: ophthalmology, orthopedics, urology, dentistry, oncology, and radiology. In ophthalmology, the LLM with the highest accuracy was Aeyeconsult (SUCRA=0.8334), followed by ChatGPT-4 (SUCRA=0.6331) and PaLM2 (SUCRA=0.5517). In the field of orthopedics, the LLM accuracy rates, from highest to lowest, were for Bard (SUCRA=0.7219), people (SUCRA=0.6802), and Bing chat (SUCRA=0.4732). For urology, Bing chat (SUCRA=0.7905) was the most accurate, followed by people (SUCRA=0.6587) and ChatGPT-4 (SUCRA=0.5941). In dentistry, ChatGPT-4 (SUCRA=0.9473) was the most accurate, followed by Bard (SUCRA=0.7068) and Gemini (SUCRA=0.5535). ChatGPT-4 (SUCRA=0.9002) performed the best in oncology, followed by ChatGPT-4o (SUCRA=0.8998) and Claude (SUCRA=0.7159). In radiology, ChatGPT-4o (SUCRA=0.9053) performed the best, ChatGPT-4 (SUCRA=0.7777) was second, and Claude 3 Opus (SUCRA=0.6935) ranked third. The SUCRAs are shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Surface under the cumulative ranking curve (SUCRAs) for the accuracy, with higher rankings associated with larger outcome values, of different large language models (LLMs) in (A) ophthalmology, (B) orthopedics, (C) urology, (D) dentistry, (E) oncology, and (F) radiology. The letters in the keys indicate the following LLMs: C: ChatGPT-3.5; D: ChatGPT-4; E: ChatGPT-4o; E1: people; G: Bard; H: PaLM2; H1: Aeyeconsult; I: Gemini; L: Bing chat; P: Claude; T: Claude 3 Opus; U: Claude 3 Sonnet; W: LLaMA 7B; X: LLaMA 13B; Y: LLaMA 33B; Z: LLaMA 65B.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e64486_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Open-Ended Questions</title>
          <p>The accuracy of the LLMs when responding to open-ended questions was examined in 34 studies [<xref ref-type="bibr" rid="ref122">122</xref>-<xref ref-type="bibr" rid="ref155">155</xref>]. The relationships within the evidence network are plotted in <xref rid="figure2" ref-type="fig">Figure 2</xref>B and include 14 LLMs and a total of 2026 open-ended questions. Direct and indirect comparisons were formed for each LLM, partially forming a closed loop. The results of the indirect comparison are presented in <xref ref-type="supplementary-material" rid="app10">Multimedia Appendix 10</xref>, where red cells indicate statistically significant differences between the column-defining regimen and the row-defining regimen (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>). There was no evidence of a statistically significant inconsistency (all <italic>P</italic>&gt;.05) in the node-splitting test for the NMA, except for Bard versus ChatGPT-3.5 (<italic>P</italic>=.02; <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>). The trace and density plots are shown in <xref ref-type="supplementary-material" rid="app9">Multimedia Appendix 9</xref>, and from the results, the iterative convergence was good. The best probability ranking indicated that ChatGPT-4 (SUCRA=0.8708) exhibited the highest accuracy when answering open-ended questions, followed by Claude 2.1 (SUCRA=0.7796) and Doctor GPT (SUCRA=0.7450; <xref ref-type="table" rid="table1">Table 1</xref>, <xref rid="figure4" ref-type="fig">Figure 4</xref>B).</p>
        </sec>
        <sec>
          <title>Top 1 Diagnosis, Top 3 Diagnosis, and Top 5 Diagnosis</title>
          <p>The accuracy of the top 1 diagnosis in clinical cases by LLMs was reported in 19 studies [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref156">156</xref>-<xref ref-type="bibr" rid="ref173">173</xref>]. The evidence network relationship diagram is shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>C and involves 12 LLMs and a total of 1266 clinical cases. The accuracy of LLMs for the top 3 diagnosis was reported in 7 studies [<xref ref-type="bibr" rid="ref158">158</xref>,<xref ref-type="bibr" rid="ref161">161</xref>,<xref ref-type="bibr" rid="ref169">169</xref>,<xref ref-type="bibr" rid="ref171">171</xref>,<xref ref-type="bibr" rid="ref174">174</xref>-<xref ref-type="bibr" rid="ref176">176</xref>]. The evidence network relationships are plotted in <xref rid="figure2" ref-type="fig">Figure 2</xref>D and involve 8 LLMs and a total of 453 clinical cases. The accuracy of LLMs for the top 5 diagnosis in clinical cases was reported in 7 studies [<xref ref-type="bibr" rid="ref158">158</xref>,<xref ref-type="bibr" rid="ref167">167</xref>,<xref ref-type="bibr" rid="ref168">168</xref>,<xref ref-type="bibr" rid="ref173">173</xref>,<xref ref-type="bibr" rid="ref177">177</xref>-<xref ref-type="bibr" rid="ref179">179</xref>]. The evidence network relationships are plotted in <xref rid="figure2" ref-type="fig">Figure 2</xref>E and involve 11 LLMs and a total of 443 clinical cases. Each LLM formed direct and indirect comparisons, partially closing the loop.</p>
          <p>In terms of the top 1 diagnosis and top 5 diagnosis, the results of the indirect comparison are presented in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>, where red cells indicate statistically significant differences between the column-defining regimen and the row-defining regimen. For the top 3 diagnosis, there was no statistical difference (all <italic>P</italic>&gt;.05) in the comparisons between the LLMs (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>). There was no evidence of a statistically significant inconsistency (all <italic>P</italic>&gt;.05) for the top 1 diagnosis, except for Ada Health versus ChatGPT-3.5 (<italic>P</italic>=.04). For the top 3 diagnosis and top 5 diagnosis, all <italic>P</italic> were &gt;.05 in the node-splitting test for the NMA (<xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>). Iterative convergence was good, as shown by the trace and density plots (<xref ref-type="supplementary-material" rid="app9">Multimedia Appendix 9</xref>). The best probability ranking showed that, in terms of accuracy of the top 1 diagnosis in clinical cases, people ranked first (SUCRA=0.9001), Ada Health ranked second (SUCRA=0.8363), and WebMD ranked third (SUCRA=0.7511; <xref ref-type="table" rid="table1">Table 1</xref>, <xref rid="figure4" ref-type="fig">Figure 4</xref>C). In terms of the accuracy of the top 3 diagnosis, people ranked first (SUCRA=0.7126), ChatGPT-4 ranked second (SUCRA=0.6302), and Ada Health ranked third (SUCRA=0.6273; <xref ref-type="table" rid="table1">Table 1</xref>, <xref rid="figure4" ref-type="fig">Figure 4</xref>D). For the accuracy of the top 5 diagnosis, Claude 3 Opus ranked first (SUCRA=0.9672), ChatGPT-4 ranked second (SUCRA=0.8089), and Gemini 1.5 pro ranked third (SUCRA=0.7905; <xref ref-type="table" rid="table1">Table 1</xref>, <xref rid="figure4" ref-type="fig">Figure 4</xref>E).</p>
        </sec>
        <sec>
          <title>Triage and Classification</title>
          <p>The accuracy of LLMs in triage and classification was reported in 7 studies [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref167">167</xref>,<xref ref-type="bibr" rid="ref169">169</xref>,<xref ref-type="bibr" rid="ref174">174</xref>,<xref ref-type="bibr" rid="ref180">180</xref>-<xref ref-type="bibr" rid="ref182">182</xref>]. The evidence network relationships are plotted in <xref rid="figure2" ref-type="fig">Figure 2</xref>F and involve 9 LLMs and a total of 901 clinical cases. Each LLM formed direct and indirect comparisons, partially closing the loop. The results of the indirect comparison are shown in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>. There were significant differences between Gemini and ChatGPT-3.5, ChatGPT-4, or Bing chat (<italic>P</italic>&lt;.05). There was no evidence of a statistically significant inconsistency (all <italic>P</italic>&gt;.05) in the node-splitting test for the NMA, except for ChatGPT-3.5 versus ChatGPT-4 (<italic>P</italic>=.045; <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>). Iterative convergence was good, as shown by the trace and density plots (<xref ref-type="supplementary-material" rid="app9">Multimedia Appendix 9</xref>). The best probability ranking showed that, for the accuracy of triage and classification, Gemini ranked first (SUCRA=0.9649), ChatGPT-4 ranked second (SUCRA=0.6185), and Bard ranked third (SUCRA=0.5885), as shown in <xref ref-type="table" rid="table1">Table 1</xref> and <xref rid="figure4" ref-type="fig">Figure 4</xref>F.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study presents the most comprehensive meta-analysis to date on the accuracy of various LLMs when responding to medical queries, encompassing objective questions, open-ended questions, top 1 diagnosis, top 3 diagnosis, top 5 diagnosis, and triage and classification. Variations in accuracy among different LLMs were observed. ChatGPT-4o demonstrated the highest accuracy when answering objective questions, while ChatGPT-4 excelled at open-ended questions. The superior performance of people at the top 1 diagnosis and top 3 diagnosis suggests that human expertise is generally more dependable than LLMs in complex medical scenarios, while Claude 3 Opus seems to perform the best in the top 5 diagnosis. In terms of triage and classification, Gemini appeared to be more reliable.</p>
        <p>In addition, we stratified LLMs according to the medical field in which the objective questions were located and explored their accuracy in 6 fields: ophthalmology, orthopedics, urology, dentistry, oncology, and radiology. We found that Aeyeconsult performed the best in ophthalmology, Bard performed the best in orthopedics, Bing chat performed the best in urology, ChatGPT-4 performed the best in both dentistry and oncology, and ChatGPT-4o had the highest accuracy in radiology.</p>
        <p>At present, language models based on transformer architecture, whether pretrained or fine-tuned using biomedical corpora, have been proven effective in a series of natural language processing benchmarks in the biomedical field [<xref ref-type="bibr" rid="ref183">183</xref>]. We attempted to analyze the reasons for the performance differences when different LLMs answer questions. Parameter size is an important factor affecting the accuracy of LLMs when answering questions. Research has found that, when the parameter size of the PaLM model is expanded from 8B to 40B, the accuracy of answering medical questions is doubled [<xref ref-type="bibr" rid="ref184">184</xref>]. However, the practicality of a model depends not only on its number of parameters but also on many factors such as its training data, fine-tuning protocols, and overall architecture [<xref ref-type="bibr" rid="ref185">185</xref>]. Taking GPT-4 as an example, it achieved a higher performance than its predecessor by adopting more advanced training data and architecture. The timeliness and accuracy of training data are also crucial for model performance. Today, models can rely not only on a limited set of pretraining data but can also obtain the latest knowledge from the internet in real time. For example, Bing AI and Google Bard already have the ability to obtain real-time updates, and ChatGPT has also begun to follow suit by accepting plugins to expand its capabilities [<xref ref-type="bibr" rid="ref185">185</xref>,<xref ref-type="bibr" rid="ref186">186</xref>].</p>
        <p>In addition, we found that some models fine-tuned on the backend LLM can achieve higher accuracy and less energy consumption in specific fields. For example, in the field of ophthalmology, Aeyeconsult integrates many ophthalmic data sets based on GPT-4 for training and generation [<xref ref-type="bibr" rid="ref24">24</xref>]. This targeted training can significantly improve its performance in ophthalmic clinical tasks. Other possible data sources include clinical texts and accurate medical information, such as guidelines and peer-reviewed literature. In fact, there are already some models built or fine-tuned based on clinical text, such as SkinGPT-4 and ChatDoctor, which perform better overall than various general LLMs at biomedical natural language processing tasks [<xref ref-type="bibr" rid="ref187">187</xref>,<xref ref-type="bibr" rid="ref188">188</xref>].</p>
        <p>Progress on various LLMs has been very rapid, with a newer, more computationally powerful version being released every few months. However, our results show that the newer versions do not necessarily outperform the older ones in terms of accuracy, possibly because fewer studies of the newer versions were included, which may have biased the results somewhat. In addition, updated versions such as ChatGPT-4V are multimodal models (eg, they can evaluate image-based problems), and these models may have a greater advantage for image evaluation.</p>
        <p>Studies indicate LLMs outperform humans at exams like medical licensing, orthopedics, and pediatrics globally, highlighting LLMs’ potential as a study aid. For the top 1 diagnosis and top 3 diagnosis, human accuracy is higher than that of LLMs. Despite the fact that Claude 3 Opus outperformed humans in the top 5 diagnostic results, due to the high level of accuracy required in the medical field and the multifaceted information and complex decision-making involved in medical diagnosis, we still recommend that LLMs should only be used as an auxiliary tool to assist doctors with more efficient data analysis and preliminary diagnostic recommendations.</p>
        <p>Several meta-analyses have been conducted to assess the accuracy of LLMs in health care [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref189">189</xref>,<xref ref-type="bibr" rid="ref190">190</xref>]. However, it is unfortunate that these studies included only ChatGPT and that some of them simply evaluated its performance on exams. Some studies did not differentiate between the types of questions answered by ChatGPT, which led to a significant amount of heterogeneity between the studies, resulting in biased results.</p>
        <p>We acknowledge certain limitations in our study. First, for the top 3 diagnosis, top 5 diagnosis, and triage and classification, the small number of included studies and the limited sample sizes may have biased the results, so caution is needed when interpreting these results. Although we minimized the heterogeneity of the research as much as possible, we cannot deny that the inclusion of different fields of study and the complexity of LLMs (such as different instructions and questioning dates) can affect the results of the study and generate heterogeneity. Therefore, caution should be exercised when interpreting the results. In addition, we did not assess the accuracy of multimodal LLMs when solving medical image–related problems; with the development of artificial intelligence, more multimodal models are being developed, and in the future, these models will become indispensable in the exploration of image-based problems in the medical field.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Existing studies suggest that ChatGPT-4o has an advantage for answering objective questions. For open-ended questions, ChatGPT-4 may be more credible. Humans are more accurate in the top 1 diagnosis and top 3 diagnosis of clinical cases. Claude 3 Opus performs better in the top 5 diagnosis, while for classification accuracy, Gemini is more advantageous. Although some LLMs excel at addressing medical queries, caution is advised due to the critical need for precision and rigor in medicine. Future high-quality studies and trials are necessary to gather more scientific evidence.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>PRISMA checklist.</p>
        <media xlink:href="jmir_v27i1e64486_app1.docx" xlink:title="DOCX File , 28 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Search strategy.</p>
        <media xlink:href="jmir_v27i1e64486_app2.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Versions and timelines of LLM iterations.</p>
        <media xlink:href="jmir_v27i1e64486_app3.docx" xlink:title="DOCX File , 20 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Examples of the outcomes.</p>
        <media xlink:href="jmir_v27i1e64486_app4.docx" xlink:title="DOCX File , 1341 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Description of 168 studies included.</p>
        <media xlink:href="jmir_v27i1e64486_app5.docx" xlink:title="DOCX File , 196 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Quality assessment of observational study.</p>
        <media xlink:href="jmir_v27i1e64486_app6.docx" xlink:title="DOCX File , 66 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Indirect comparison results.</p>
        <media xlink:href="jmir_v27i1e64486_app7.docx" xlink:title="DOCX File , 1355 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Node splitting inconsistency test.</p>
        <media xlink:href="jmir_v27i1e64486_app8.docx" xlink:title="DOCX File , 2606 KB"/>
      </supplementary-material>
      <supplementary-material id="app9">
        <label>Multimedia Appendix 9</label>
        <p>Trace and density plots.</p>
        <media xlink:href="jmir_v27i1e64486_app9.docx" xlink:title="DOCX File , 3634 KB"/>
      </supplementary-material>
      <supplementary-material id="app10">
        <label>Multimedia Appendix 10</label>
        <p>Objective questions are stratified according to different fields of the questions.</p>
        <media xlink:href="jmir_v27i1e64486_app10.docx" xlink:title="DOCX File , 13 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CINEMA</term>
          <def>
            <p>Confidence in Network Meta-Analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">GRADE</term>
          <def>
            <p>Grading of Recommendations Assessment, Development, and Evaluation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NMA</term>
          <def>
            <p>network meta-analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">OR</term>
          <def>
            <p>odds ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PRISMA</term>
          <def>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SUCRA</term>
          <def>
            <p>surface under the cumulative ranking curve</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the Training Program for Young and Middle-aged Backbone Talents of Fujian Provincial Health Commission (grant number 2022GGA001), Natural Science Foundation of Fujian Province (grant numbers 2021J01395 and 2024J011032), Foundations of Department of Finance of Fujian Province (grant numbers Min Cai Zhi (2023) 830 and Min Cai Zhi (2024) 881), Joint Funding Projects for Innovation in Science and Technology of Fujian Province (grant number 2023Y9330), and Internal Supporting Project of Fuzhou University Affiliated Provincial Hospital (grant number 0080072220).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data sets generated or analyzed during this study are available from the corresponding author on reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>All authors were involved in the conceptualization and design of the study and reviewed all documents and materials. LW, JL, BZ, and SH collected the data, performed data analysis, interpreted the results, and wrote the first draft of the manuscript. CW, WL, and MZ were involved in the development of the protocol for the systematic review and critically reviewed the results and the manuscript. MF and SG were involved in the development of the protocol and revised the manuscript. All authors read and approved the final manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Heacock</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Elias</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hentel</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Reig</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Shih</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Moy</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT and other large language models are double-edged swords</article-title>
          <source>Radiology</source>
          <year>2023</year>
          <month>04</month>
          <volume>307</volume>
          <issue>2</issue>
          <fpage>e230163</fpage>
          <pub-id pub-id-type="doi">10.1148/radiol.230163</pub-id>
          <pub-id pub-id-type="medline">36700838</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>No authors listed</collab>
          </person-group>
          <article-title>Will ChatGPT transform healthcare?</article-title>
          <source>Nat Med</source>
          <year>2023</year>
          <month>03</month>
          <day>14</day>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>505</fpage>
          <lpage>506</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-023-02289-5</pub-id>
          <pub-id pub-id-type="medline">36918736</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-023-02289-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Pinto-Powell</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Thesen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lindqwister</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chacko</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bridges</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schwendt</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Byrum</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shasavari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hassanpour</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Preparing healthcare leaders of the digital age with an integrative artificial intelligence curriculum: a pilot study</article-title>
          <source>Med Educ Online</source>
          <year>2024</year>
          <month>12</month>
          <day>31</day>
          <volume>29</volume>
          <issue>1</issue>
          <fpage>2315684</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.tandfonline.com/doi/10.1080/10872981.2024.2315684?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10872981.2024.2315684</pub-id>
          <pub-id pub-id-type="medline">38351737</pub-id>
          <pub-id pub-id-type="pmcid">PMC10868429</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sblendorio</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dentamaro</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Lo Cascio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Germini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Piredda</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cicolini</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Integrating human expertise and automated methods for a dynamic and multi-parametric evaluation of large language models' feasibility in clinical decision-making</article-title>
          <source>Int J Med Inform</source>
          <year>2024</year>
          <month>08</month>
          <volume>188</volume>
          <fpage>105501</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1386-5056(24)00164-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2024.105501</pub-id>
          <pub-id pub-id-type="medline">38810498</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(24)00164-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The potential applications and challenges of ChatGPT in the medical field</article-title>
          <source>Int J Gen Med</source>
          <year>2024</year>
          <month>03</month>
          <volume>17</volume>
          <fpage>817</fpage>
          <lpage>826</lpage>
          <pub-id pub-id-type="doi">10.2147/ijgm.s456659</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pillai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Paget</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Naugler</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Assessing the research landscape and clinical utility of large language models: a scoping review</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2024</year>
          <month>03</month>
          <day>12</day>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>72</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-024-02459-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-024-02459-6</pub-id>
          <pub-id pub-id-type="medline">38475802</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-024-02459-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC10936025</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Copilot</article-title>
          <source>Microsoft</source>
          <access-date>2025-04-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.microsoft.com/en-us/microsoft-copilot">https://www.microsoft.com/en-us/microsoft-copilot</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>Gemini</article-title>
          <source>Google</source>
          <access-date>2025-04-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://gemini.google.com/">https://gemini.google.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>Llama</article-title>
          <source>Meta</source>
          <access-date>2025-04-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://llama.meta.com/">https://llama.meta.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsoutsanis</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tsoutsanis</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of large language model performance on the Multi-Specialty Recruitment Assessment (MSRA) exam</article-title>
          <source>Comput Biol Med</source>
          <year>2024</year>
          <month>01</month>
          <volume>168</volume>
          <fpage>107794</fpage>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.107794</pub-id>
          <pub-id pub-id-type="medline">38043471</pub-id>
          <pub-id pub-id-type="pii">S0010-4825(23)01259-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shukla</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The comparison of ChatGPT 3.5, Microsoft Bing, and Google Gemini for diagnosing cases of neuro-ophthalmology</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>04</month>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>e58232</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38745784"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.58232</pub-id>
          <pub-id pub-id-type="medline">38745784</pub-id>
          <pub-id pub-id-type="pmcid">PMC11092423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pressman</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Borna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez-Cabello</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Haider</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Forte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>AI in hand surgery: assessing large language models in the classification and management of hand injuries</article-title>
          <source>J Clin Med</source>
          <year>2024</year>
          <month>05</month>
          <day>11</day>
          <volume>13</volume>
          <issue>10</issue>
          <fpage>2832</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jcm13102832"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jcm13102832</pub-id>
          <pub-id pub-id-type="medline">38792374</pub-id>
          <pub-id pub-id-type="pii">jcm13102832</pub-id>
          <pub-id pub-id-type="pmcid">PMC11122623</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaishya</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Iyengar</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Patralekh</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Botchu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shirodkar</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Vaish</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Scarlat</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness of AI-powered chatbots in responding to orthopaedic postgraduate exam questions-an observational study</article-title>
          <source>Int Orthop</source>
          <year>2024</year>
          <month>08</month>
          <day>15</day>
          <volume>48</volume>
          <issue>8</issue>
          <fpage>1963</fpage>
          <lpage>1969</lpage>
          <pub-id pub-id-type="doi">10.1007/s00264-024-06182-9</pub-id>
          <pub-id pub-id-type="medline">38619565</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00264-024-06182-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tessier</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Brar</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Malone</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>McKechnie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kroh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>JT</given-names>
            </name>
            <collab>ASMBS Artificial Intelligence and Digital Surgery Taskforce</collab>
          </person-group>
          <article-title>Performance of artificial intelligence in bariatric surgery: comparative analysis of ChatGPT-4, Bing, and Bard in the American Society for Metabolic and Bariatric Surgery textbook of bariatric surgery questions</article-title>
          <source>Surg Obes Relat Dis</source>
          <year>2024</year>
          <month>07</month>
          <volume>20</volume>
          <issue>7</issue>
          <fpage>609</fpage>
          <lpage>613</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1550-7289(24)00169-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.soard.2024.04.014</pub-id>
          <pub-id pub-id-type="medline">38782611</pub-id>
          <pub-id pub-id-type="pii">S1550-7289(24)00169-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of ChatGPT-generated medical responses: a systematic review and meta-analysis</article-title>
          <source>J Biomed Inform</source>
          <year>2024</year>
          <month>03</month>
          <volume>151</volume>
          <fpage>104620</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(24)00038-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2024.104620</pub-id>
          <pub-id pub-id-type="medline">38462064</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(24)00038-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaboudi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Firouzbakht</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shahir Eftekhar</surname>
              <given-names>Mohammad</given-names>
            </name>
            <name name-style="western">
              <surname>Fayazbakhsh</surname>
              <given-names>Fatemeh</given-names>
            </name>
            <name name-style="western">
              <surname>Joharivarnoosfaderani</surname>
              <given-names>Niloufar</given-names>
            </name>
            <name name-style="western">
              <surname>Ghaderi</surname>
              <given-names>Salar</given-names>
            </name>
            <name name-style="western">
              <surname>Dehdashti</surname>
              <given-names>Mohammadreza</given-names>
            </name>
            <name name-style="western">
              <surname>Mohtasham Kia</surname>
              <given-names>Yasmin</given-names>
            </name>
            <name name-style="western">
              <surname>Afshari</surname>
              <given-names>Maryam</given-names>
            </name>
            <name name-style="western">
              <surname>Vasaghi-Gharamaleki</surname>
              <given-names>Maryam</given-names>
            </name>
            <name name-style="western">
              <surname>Haghani</surname>
              <given-names>Leila</given-names>
            </name>
            <name name-style="western">
              <surname>Moradzadeh</surname>
              <given-names>Zahra</given-names>
            </name>
            <name name-style="western">
              <surname>Khalaj</surname>
              <given-names>Fattaneh</given-names>
            </name>
            <name name-style="western">
              <surname>Mohammadi</surname>
              <given-names>Zahra</given-names>
            </name>
            <name name-style="western">
              <surname>Hasanabadi</surname>
              <given-names>Zahra</given-names>
            </name>
            <name name-style="western">
              <surname>Shahidi</surname>
              <given-names>Ramin</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic accuracy of ChatGPT for patients' triage; a systematic review and meta-analysis</article-title>
          <source>Arch Acad Emerg Med</source>
          <year>2024</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>e60</fpage>
          <pub-id pub-id-type="doi">10.22037/aaem.v12i1.2384</pub-id>
          <pub-id pub-id-type="medline">39290765</pub-id>
          <pub-id pub-id-type="pmcid">PMC11407534</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patil</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Serrato</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chisvo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Arnaout</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>See</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>KT</given-names>
            </name>
          </person-group>
          <article-title>Large language models in neurosurgery: a systematic review and meta-analysis</article-title>
          <source>Acta Neurochir (Wien)</source>
          <year>2024</year>
          <month>11</month>
          <day>23</day>
          <volume>166</volume>
          <issue>1</issue>
          <fpage>475</fpage>
          <pub-id pub-id-type="doi">10.1007/s00701-024-06372-9</pub-id>
          <pub-id pub-id-type="medline">39579215</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00701-024-06372-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>HP</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Hoang</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>VA</given-names>
            </name>
          </person-group>
          <article-title>Accuracy of latest large language models in answering multiple choice questions in dentistry: a comparative study</article-title>
          <source>PLoS One</source>
          <year>2025</year>
          <month>01</month>
          <day>29</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>e0317423</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0317423"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0317423</pub-id>
          <pub-id pub-id-type="medline">39879192</pub-id>
          <pub-id pub-id-type="pii">PONE-D-24-40356</pub-id>
          <pub-id pub-id-type="pmcid">PMC11778630</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lo</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Mertz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Loeb</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Newcastle-Ottawa Scale: comparing reviewers' to authors' assessments</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2014</year>
          <month>04</month>
          <day>01</day>
          <volume>14</volume>
          <fpage>45</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-14-45"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2288-14-45</pub-id>
          <pub-id pub-id-type="medline">24690082</pub-id>
          <pub-id pub-id-type="pii">1471-2288-14-45</pub-id>
          <pub-id pub-id-type="pmcid">PMC4021422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Long</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Subburam</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dos Santos</surname>
              <given-names>André</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Saduka</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Horev</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Côté</surname>
              <given-names>David W J</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>ED</given-names>
            </name>
          </person-group>
          <article-title>ChatENT: augmented large language model for expert knowledge retrieval in otolaryngology-head and neck surgery</article-title>
          <source>Otolaryngol Head Neck Surg</source>
          <year>2024</year>
          <month>10</month>
          <day>19</day>
          <volume>171</volume>
          <issue>4</issue>
          <fpage>1042</fpage>
          <lpage>1051</lpage>
          <pub-id pub-id-type="doi">10.1002/ohn.864</pub-id>
          <pub-id pub-id-type="medline">38895862</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Hua</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Milkovich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Micieli</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT-3.5 and Bing Chat in ophthalmology: an updated evaluation of performance, readability, and informative sources</article-title>
          <source>Eye (Lond)</source>
          <year>2024</year>
          <month>07</month>
          <day>20</day>
          <volume>38</volume>
          <issue>10</issue>
          <fpage>1897</fpage>
          <lpage>1902</lpage>
          <pub-id pub-id-type="doi">10.1038/s41433-024-03037-w</pub-id>
          <pub-id pub-id-type="medline">38509182</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41433-024-03037-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC11226422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shieh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Freed</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Majety</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Assessing ChatGPT 4.0's test performance and clinical diagnostic accuracy on USMLE STEP 2 CK and clinical case reports</article-title>
          <source>Sci Rep</source>
          <year>2024</year>
          <month>04</month>
          <day>23</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>9330</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-024-58760-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-024-58760-x</pub-id>
          <pub-id pub-id-type="medline">38654011</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-024-58760-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC11039662</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarangi</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Narayan</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Mohakud</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vats</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sahani</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mondal</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Assessing the capability of ChatGPT, Google Bard, and Microsoft Bing in solving radiology case vignettes</article-title>
          <source>Indian J Radiol Imaging</source>
          <year>2024</year>
          <month>04</month>
          <day>29</day>
          <volume>34</volume>
          <issue>2</issue>
          <fpage>276</fpage>
          <lpage>282</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0043-1777746"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0043-1777746</pub-id>
          <pub-id pub-id-type="medline">38549897</pub-id>
          <pub-id pub-id-type="pii">IJRI-23-9-2963</pub-id>
          <pub-id pub-id-type="pmcid">PMC10972658</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singer</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Teng</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <article-title>Development and evaluation of Aeyeconsult: a novel ophthalmology chatbot leveraging verified textbook knowledge and GPT-4</article-title>
          <source>J Surg Educ</source>
          <year>2024</year>
          <month>03</month>
          <volume>81</volume>
          <issue>3</issue>
          <fpage>438</fpage>
          <lpage>443</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jsurg.2023.11.019</pub-id>
          <pub-id pub-id-type="medline">38135548</pub-id>
          <pub-id pub-id-type="pii">S1931-7204(23)00432-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hanna</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>Mhaskar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hanna</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Performance of language models on the family medicine in-training exam</article-title>
          <source>Fam Med</source>
          <year>2024</year>
          <month>10</month>
          <day>02</day>
          <volume>56</volume>
          <issue>9</issue>
          <fpage>555</fpage>
          <lpage>560</lpage>
          <pub-id pub-id-type="doi">10.22454/fammed.2024.233738</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kadoya</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Arai</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tozuka</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yasui</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hayashi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Katsuta</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Inoue</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jingu</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Assessing knowledge about medical physics in language-generative AI with large language model: using the medical physicist exam</article-title>
          <source>Radiol Phys Technol</source>
          <year>2024</year>
          <month>12</month>
          <day>10</day>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>929</fpage>
          <lpage>937</lpage>
          <pub-id pub-id-type="doi">10.1007/s12194-024-00838-2</pub-id>
          <pub-id pub-id-type="medline">39254919</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12194-024-00838-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sallam</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Mahzoum</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Almutawaa</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Alhashash</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Dashti</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>AlSafy</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Almutairi</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Barakat</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The performance of OpenAI ChatGPT-4 and Google Gemini in virology multiple-choice questions: a comparative analysis of English and Arabic responses</article-title>
          <source>BMC Res Notes</source>
          <year>2024</year>
          <month>09</month>
          <day>03</day>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>247</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcresnotes.biomedcentral.com/articles/10.1186/s13104-024-06920-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13104-024-06920-7</pub-id>
          <pub-id pub-id-type="medline">39228001</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13104-024-06920-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC11373487</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gravina</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Pellegrino</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Palladino</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Imperio</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ventura</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Federico</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Charting new AI education in gastroenterology: cross-sectional evaluation of ChatGPT and Perplexity AI in medical residency exam</article-title>
          <source>Dig Liver Dis</source>
          <year>2024</year>
          <month>08</month>
          <volume>56</volume>
          <issue>8</issue>
          <fpage>1304</fpage>
          <lpage>1311</lpage>
          <pub-id pub-id-type="doi">10.1016/j.dld.2024.02.019</pub-id>
          <pub-id pub-id-type="medline">38503659</pub-id>
          <pub-id pub-id-type="pii">S1590-8658(24)00302-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Passby</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jenko</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wernham</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on specialty certificate examination in dermatology multiple-choice questions</article-title>
          <source>Clin Exp Dermatol</source>
          <year>2024</year>
          <month>06</month>
          <day>25</day>
          <volume>49</volume>
          <issue>7</issue>
          <fpage>722</fpage>
          <lpage>727</lpage>
          <pub-id pub-id-type="doi">10.1093/ced/llad197</pub-id>
          <pub-id pub-id-type="medline">37264670</pub-id>
          <pub-id pub-id-type="pii">7188526</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sabri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Saleh</surname>
              <given-names>MHA</given-names>
            </name>
            <name name-style="western">
              <surname>Hazrati</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Misch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Barootchi</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Performance of three artificial intelligence (AI)-based large language models in standardized testing; implications for AI-assisted dental education</article-title>
          <source>J Periodontal Res</source>
          <year>2025</year>
          <month>02</month>
          <day>18</day>
          <volume>60</volume>
          <issue>2</issue>
          <fpage>121</fpage>
          <lpage>133</lpage>
          <pub-id pub-id-type="doi">10.1111/jre.13323</pub-id>
          <pub-id pub-id-type="medline">39030766</pub-id>
          <pub-id pub-id-type="pmcid">PMC11873669</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Çamur</surname>
              <given-names>Eren</given-names>
            </name>
            <name name-style="western">
              <surname>Cesur</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Güneş</surname>
              <given-names>Yasin Celal</given-names>
            </name>
          </person-group>
          <article-title>Can large language models be new supportive tools in coronary computed tomography angiography reporting?</article-title>
          <source>Clin Imaging</source>
          <year>2024</year>
          <month>10</month>
          <volume>114</volume>
          <fpage>110271</fpage>
          <pub-id pub-id-type="doi">10.1016/j.clinimag.2024.110271</pub-id>
          <pub-id pub-id-type="medline">39236553</pub-id>
          <pub-id pub-id-type="pii">S0899-7071(24)00201-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lubitz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Latario</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Performance of two artificial intelligence generative language models on the orthopaedic in-training examination</article-title>
          <source>Orthopedics</source>
          <year>2024</year>
          <month>05</month>
          <volume>47</volume>
          <issue>3</issue>
          <fpage>e146</fpage>
          <lpage>e150</lpage>
          <pub-id pub-id-type="doi">10.3928/01477447-20240304-02</pub-id>
          <pub-id pub-id-type="medline">38466827</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hamid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jhaveri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Suthar</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Comparative evaluation of AI models such as ChatGPT 3.5, ChatGPT 4.0, and Google Gemini in neuroradiology diagnostics</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>08</month>
          <volume>16</volume>
          <issue>8</issue>
          <fpage>e67766</fpage>
          <pub-id pub-id-type="doi">10.7759/cureus.67766</pub-id>
          <pub-id pub-id-type="medline">39323714</pub-id>
          <pub-id pub-id-type="pmcid">PMC11422621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Jong Won</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Young Hwan</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>Sang O</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Kyeong Ryong</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the problem-solving performance of ChatGPT-3.5, ChatGPT-4, Bing Chat, and Bard for the Korean emergency medicine board examination question bank</article-title>
          <source>Medicine (Baltimore)</source>
          <year>2024</year>
          <month>03</month>
          <day>01</day>
          <volume>103</volume>
          <issue>9</issue>
          <fpage>e37325</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38428889"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MD.0000000000037325</pub-id>
          <pub-id pub-id-type="medline">38428889</pub-id>
          <pub-id pub-id-type="pii">00005792-202403010-00048</pub-id>
          <pub-id pub-id-type="pmcid">PMC10906566</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Is</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Menekseoglu</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Comparative performance of artificial intelligence models in rheumatology board-level questions: evaluating Google Gemini and ChatGPT-4o</article-title>
          <source>Clin Rheumatol</source>
          <year>2024</year>
          <month>11</month>
          <day>28</day>
          <volume>43</volume>
          <issue>11</issue>
          <fpage>3507</fpage>
          <lpage>3513</lpage>
          <pub-id pub-id-type="doi">10.1007/s10067-024-07154-5</pub-id>
          <pub-id pub-id-type="medline">39340572</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10067-024-07154-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>D'Anna</surname>
              <given-names>Gennaro</given-names>
            </name>
            <name name-style="western">
              <surname>Van Cauter</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thurnher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Van Goethem</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Haller</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Can large language models pass official high-grade exams of the European Society of Neuroradiology courses? A direct comparison between OpenAI ChatGPT 3.5, OpenAI GPT4 and Google Bard</article-title>
          <source>Neuroradiology</source>
          <year>2024</year>
          <month>08</month>
          <day>06</day>
          <volume>66</volume>
          <issue>8</issue>
          <fpage>1245</fpage>
          <lpage>1250</lpage>
          <pub-id pub-id-type="doi">10.1007/s00234-024-03371-6</pub-id>
          <pub-id pub-id-type="medline">38705899</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00234-024-03371-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Altamimi</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Alhumimidi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alshehri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Alrumayan</surname>
              <given-names>Abdullah</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Khlaiwi</surname>
              <given-names>Thamir</given-names>
            </name>
            <name name-style="western">
              <surname>Meo</surname>
              <given-names>Sultan A</given-names>
            </name>
            <name name-style="western">
              <surname>Temsah</surname>
              <given-names>Mohamad-Hani</given-names>
            </name>
          </person-group>
          <article-title>The scientific knowledge of three large language models in cardiology: multiple-choice questions examination-based performance</article-title>
          <source>Ann Med Surg (Lond)</source>
          <year>2024</year>
          <month>06</month>
          <volume>86</volume>
          <issue>6</issue>
          <fpage>3261</fpage>
          <lpage>3266</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38846858"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MS9.0000000000002120</pub-id>
          <pub-id pub-id-type="medline">38846858</pub-id>
          <pub-id pub-id-type="pii">AMSU-D-23-02753</pub-id>
          <pub-id pub-id-type="pmcid">PMC11152788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schoch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schmelz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Strauch</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Borgmann</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nestler</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT-3.5 and ChatGPT-4 on the European Board of Urology (EBU) exams: a comparative analysis</article-title>
          <source>World J Urol</source>
          <year>2024</year>
          <month>07</month>
          <day>26</day>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>445</fpage>
          <pub-id pub-id-type="doi">10.1007/s00345-024-05137-4</pub-id>
          <pub-id pub-id-type="medline">39060792</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00345-024-05137-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>May</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Körner-Riffard</surname>
              <given-names>Katharina</given-names>
            </name>
            <name name-style="western">
              <surname>Kollitsch</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Burger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brookman-May</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Rauchenwald</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marszalek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Eredics</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the efficacy of AI chatbots as tutors in urology: a comparative analysis of responses to the 2022 In-Service Assessment of the European Board of Urology</article-title>
          <source>Urol Int</source>
          <year>2024</year>
          <month>03</month>
          <day>30</day>
          <volume>108</volume>
          <issue>4</issue>
          <fpage>359</fpage>
          <lpage>366</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1159/000537854"/>
          </comment>
          <pub-id pub-id-type="doi">10.1159/000537854</pub-id>
          <pub-id pub-id-type="medline">38555637</pub-id>
          <pub-id pub-id-type="pii">000537854</pub-id>
          <pub-id pub-id-type="pmcid">PMC11305516</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sadeq</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Ghorab</surname>
              <given-names>RMF</given-names>
            </name>
            <name name-style="western">
              <surname>Ashry</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Abozaid</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Banihani</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Salem</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aisheh</surname>
              <given-names>MTA</given-names>
            </name>
            <name name-style="western">
              <surname>Abuzahra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mourid</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Assker</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Ayyad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moawad</surname>
              <given-names>MHED</given-names>
            </name>
          </person-group>
          <article-title>AI chatbots show promise but limitations on UK medical exam questions: a comparative performance study</article-title>
          <source>Sci Rep</source>
          <year>2024</year>
          <month>08</month>
          <day>14</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>18859</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-024-68996-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-024-68996-2</pub-id>
          <pub-id pub-id-type="medline">39143077</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-024-68996-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC11324724</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khalpey</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Abraham</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Khalpey</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Large language models take on cardiothoracic surgery: a comparative analysis of the performance of four models on American Board of Thoracic Surgery exam questions in 2023</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>07</month>
          <volume>16</volume>
          <issue>7</issue>
          <fpage>e65083</fpage>
          <pub-id pub-id-type="doi">10.7759/cureus.65083</pub-id>
          <pub-id pub-id-type="medline">39171020</pub-id>
          <pub-id pub-id-type="pmcid">PMC11337141</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Fleischer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Filip</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Eggerstedt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hutz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Michaelides</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Batra</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Tajudeen</surname>
              <given-names>BA</given-names>
            </name>
          </person-group>
          <article-title>Comparative performance of ChatGPT 3.5 and GPT4 on rhinology standardized board examination questions</article-title>
          <source>OTO Open</source>
          <year>2024</year>
          <month>06</month>
          <day>27</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>e164</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38938507"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/oto2.164</pub-id>
          <pub-id pub-id-type="medline">38938507</pub-id>
          <pub-id pub-id-type="pii">OTO2164</pub-id>
          <pub-id pub-id-type="pmcid">PMC11208739</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Irmici</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cozzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Della Pepa</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>De Berardinis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>D'Ascoli</surname>
              <given-names>Elisa</given-names>
            </name>
            <name name-style="western">
              <surname>Cellina</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cè</surname>
              <given-names>Maurizio</given-names>
            </name>
            <name name-style="western">
              <surname>Depretto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scaperrotta</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>How do large language models answer breast cancer quiz questions? A comparative study of GPT-3.5, GPT-4 and Google Gemini</article-title>
          <source>Radiol Med</source>
          <year>2024</year>
          <month>10</month>
          <day>13</day>
          <volume>129</volume>
          <issue>10</issue>
          <fpage>1463</fpage>
          <lpage>1467</lpage>
          <pub-id pub-id-type="doi">10.1007/s11547-024-01872-1</pub-id>
          <pub-id pub-id-type="medline">39138732</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11547-024-01872-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kollitsch</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Eredics</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Marszalek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rauchenwald</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brookman-May</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Burger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Körner-Riffard</surname>
              <given-names>Katharina</given-names>
            </name>
            <name name-style="western">
              <surname>May</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>How does artificial intelligence master urological board examinations? A comparative analysis of different large language models' accuracy and reliability in the 2022 In-Service Assessment of the European Board of Urology</article-title>
          <source>World J Urol</source>
          <year>2024</year>
          <month>01</month>
          <day>10</day>
          <volume>42</volume>
          <issue>1</issue>
          <fpage>20</fpage>
          <pub-id pub-id-type="doi">10.1007/s00345-023-04749-6</pub-id>
          <pub-id pub-id-type="medline">38197996</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00345-023-04749-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morreel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Verhoeven</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mathysen</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Microsoft Bing outperforms five other generative artificial intelligence chatbots in the Antwerp University multiple choice medical license exam</article-title>
          <source>PLOS Digit Health</source>
          <year>2024</year>
          <month>02</month>
          <day>14</day>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>e0000349</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38354127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pdig.0000349</pub-id>
          <pub-id pub-id-type="medline">38354127</pub-id>
          <pub-id pub-id-type="pii">PDIG-D-23-00311</pub-id>
          <pub-id pub-id-type="pmcid">PMC10866461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bajčetić</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mirčić</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rakočević</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Đoković</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Milutinović</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zaletel</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Comparing the performance of artificial intelligence learning models to medical students in solving histology and embryology multiple choice questions</article-title>
          <source>Ann Anat</source>
          <year>2024</year>
          <month>06</month>
          <volume>254</volume>
          <fpage>152261</fpage>
          <pub-id pub-id-type="doi">10.1016/j.aanat.2024.152261</pub-id>
          <pub-id pub-id-type="medline">38521363</pub-id>
          <pub-id pub-id-type="pii">S0940-9602(24)00053-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Canillas Del Rey</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Canillas Arias</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Exploring the potential of artificial intelligence in traumatology: conversational answers to specific questions</article-title>
          <source>Rev Esp Cir Ortop Traumatol</source>
          <year>2025</year>
          <month>01</month>
          <volume>69</volume>
          <issue>1</issue>
          <fpage>38</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1888-4415(24)00086-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.recot.2024.05.004</pub-id>
          <pub-id pub-id-type="medline">38782358</pub-id>
          <pub-id pub-id-type="pii">S1888-4415(24)00086-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Riese</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Streichert</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the performance of GPT-3.5 and GPT-4 with that of medical students on the written German Medical Licensing Examination: observational study</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>02</month>
          <day>08</day>
          <volume>10</volume>
          <fpage>e50965</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e50965/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/50965</pub-id>
          <pub-id pub-id-type="medline">38329802</pub-id>
          <pub-id pub-id-type="pii">v10i1e50965</pub-id>
          <pub-id pub-id-type="pmcid">PMC10884900</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Toyama</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Harigai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nagano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kawabata</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Seki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Takase</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Performance evaluation of ChatGPT, GPT-4, and Bard on the official board examination of the Japan Radiology Society</article-title>
          <source>Jpn J Radiol</source>
          <year>2024</year>
          <month>02</month>
          <day>04</day>
          <volume>42</volume>
          <issue>2</issue>
          <fpage>201</fpage>
          <lpage>207</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37792149"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11604-023-01491-2</pub-id>
          <pub-id pub-id-type="medline">37792149</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11604-023-01491-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10811006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Touma</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Caterini</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liblk</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Is ChatGPT ready for primetime? Performance of artificial intelligence on a simulated Canadian urology board exam</article-title>
          <source>Can Urol Assoc J</source>
          <year>2024</year>
          <month>10</month>
          <day>10</day>
          <volume>18</volume>
          <issue>10</issue>
          <fpage>329</fpage>
          <lpage>332</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.5489/cuaj.8800"/>
          </comment>
          <pub-id pub-id-type="doi">10.5489/cuaj.8800</pub-id>
          <pub-id pub-id-type="medline">38896484</pub-id>
          <pub-id pub-id-type="pii">cuaj.8800</pub-id>
          <pub-id pub-id-type="pmcid">PMC11477513</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Angelini</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The performance of large language models in intercollegiate Membership of the Royal College of Surgeons examination</article-title>
          <source>Ann R Coll Surg Engl</source>
          <year>2024</year>
          <month>11</month>
          <day>06</day>
          <volume>106</volume>
          <issue>8</issue>
          <fpage>700</fpage>
          <lpage>704</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publishing.rcseng.ac.uk/doi/10.1308/rcsann.2024.0023?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1308/rcsann.2024.0023</pub-id>
          <pub-id pub-id-type="medline">38445611</pub-id>
          <pub-id pub-id-type="pmcid">PMC11528401</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patil</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>van der Pol</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Larocque</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Comparative performance of ChatGPT and Bard in a text-based radiology knowledge assessment</article-title>
          <source>Can Assoc Radiol J</source>
          <year>2024</year>
          <month>05</month>
          <day>14</day>
          <volume>75</volume>
          <issue>2</issue>
          <fpage>344</fpage>
          <lpage>350</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/abs/10.1177/08465371231193716?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/08465371231193716</pub-id>
          <pub-id pub-id-type="medline">37578849</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hubany</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Scala</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hashemi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kapoor</surname>
              <given-names>Saumya</given-names>
            </name>
            <name name-style="western">
              <surname>Fedorova</surname>
              <given-names>Julia R</given-names>
            </name>
            <name name-style="western">
              <surname>Vaccaro</surname>
              <given-names>Matthew J</given-names>
            </name>
            <name name-style="western">
              <surname>Ridout</surname>
              <given-names>Rees P</given-names>
            </name>
            <name name-style="western">
              <surname>Hedman</surname>
              <given-names>Casey C</given-names>
            </name>
            <name name-style="western">
              <surname>Kellogg</surname>
              <given-names>Brian C</given-names>
            </name>
            <name name-style="western">
              <surname>Leto Barone</surname>
              <given-names>Angelo A</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT-4 surpasses residents: a study of artificial intelligence competency in plastic surgery in-service examinations and its advancements from ChatGPT-3.5</article-title>
          <source>Plast Reconstr Surg Glob Open</source>
          <year>2024</year>
          <month>09</month>
          <volume>12</volume>
          <issue>9</issue>
          <fpage>e6136</fpage>
          <pub-id pub-id-type="doi">10.1097/GOX.0000000000006136</pub-id>
          <pub-id pub-id-type="medline">39239234</pub-id>
          <pub-id pub-id-type="pii">GOX-D-24-00262</pub-id>
          <pub-id pub-id-type="pmcid">PMC11377087</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nakajima</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fujimori</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Furuya</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kanie</surname>
              <given-names>Yuya</given-names>
            </name>
            <name name-style="western">
              <surname>Imai</surname>
              <given-names>Hirotatsu</given-names>
            </name>
            <name name-style="western">
              <surname>Kita</surname>
              <given-names>Kosuke</given-names>
            </name>
            <name name-style="western">
              <surname>Uemura</surname>
              <given-names>Keisuke</given-names>
            </name>
            <name name-style="western">
              <surname>Okada</surname>
              <given-names>Seiji</given-names>
            </name>
          </person-group>
          <article-title>A comparison between GPT-3.5, GPT-4, and GPT-4V: can the large language model (ChatGPT) pass the Japanese Board of Orthopaedic Surgery examination?</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>03</month>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>e56402</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38633935"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.56402</pub-id>
          <pub-id pub-id-type="medline">38633935</pub-id>
          <pub-id pub-id-type="pmcid">PMC11023708</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thibaut</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dabbagh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liverneaux</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Does Google's Bard Chatbot perform better than ChatGPT on the European hand surgery exam?</article-title>
          <source>Int Orthop</source>
          <year>2024</year>
          <month>01</month>
          <day>15</day>
          <volume>48</volume>
          <issue>1</issue>
          <fpage>151</fpage>
          <lpage>158</lpage>
          <pub-id pub-id-type="doi">10.1007/s00264-023-06034-y</pub-id>
          <pub-id pub-id-type="medline">37968408</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00264-023-06034-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lum</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dennison</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guntupalli</surname>
              <given-names>Lohitha</given-names>
            </name>
            <name name-style="western">
              <surname>Choudhary</surname>
              <given-names>Soham</given-names>
            </name>
            <name name-style="western">
              <surname>Saiz</surname>
              <given-names>Augustine M</given-names>
            </name>
            <name name-style="western">
              <surname>Randall</surname>
              <given-names>Robert L</given-names>
            </name>
          </person-group>
          <article-title>Generative artificial intelligence performs at a second-year orthopedic resident level</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>03</month>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>e56104</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38618358"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.56104</pub-id>
          <pub-id pub-id-type="medline">38618358</pub-id>
          <pub-id pub-id-type="pmcid">PMC11014641</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Menekşeoğlu</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>İş</surname>
              <given-names>EE</given-names>
            </name>
          </person-group>
          <article-title>Comparative performance of artificial intelligence models in physical medicine and rehabilitation board-level questions</article-title>
          <source>Rev Assoc Med Bras (1992)</source>
          <year>2024</year>
          <volume>70</volume>
          <issue>7</issue>
          <fpage>e20240241</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.scielo.br/scielo.php?script=sci_arttext&amp;pid=S0104-42302024000700614&amp;lng=en&amp;nrm=iso&amp;tlng=en"/>
          </comment>
          <pub-id pub-id-type="doi">10.1590/1806-9282.20240241</pub-id>
          <pub-id pub-id-type="medline">39045939</pub-id>
          <pub-id pub-id-type="pii">S0104-42302024000700614</pub-id>
          <pub-id pub-id-type="pmcid">PMC11262310</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheong</surname>
              <given-names>RCT</given-names>
            </name>
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Unadkat</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mcneillis</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Williamson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Joseph</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Randhawa</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Andrews</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Paleri</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Performance of artificial intelligence chatbots in sleep medicine certification board exams: ChatGPT versus Google Bard</article-title>
          <source>Eur Arch Otorhinolaryngol</source>
          <year>2024</year>
          <month>04</month>
          <volume>281</volume>
          <issue>4</issue>
          <fpage>2137</fpage>
          <lpage>2143</lpage>
          <pub-id pub-id-type="doi">10.1007/s00405-023-08381-3</pub-id>
          <pub-id pub-id-type="medline">38117307</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00405-023-08381-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mesnard</surname>
              <given-names>Benoît</given-names>
            </name>
            <name name-style="western">
              <surname>Schirmann</surname>
              <given-names>Aurélie</given-names>
            </name>
            <name name-style="western">
              <surname>Branchereau</surname>
              <given-names>Julien</given-names>
            </name>
            <name name-style="western">
              <surname>Perrot</surname>
              <given-names>Ophélie</given-names>
            </name>
            <name name-style="western">
              <surname>Bogaert</surname>
              <given-names>Guy</given-names>
            </name>
            <name name-style="western">
              <surname>Neuzillet</surname>
              <given-names>Yann</given-names>
            </name>
            <name name-style="western">
              <surname>Lebret</surname>
              <given-names>Thierry</given-names>
            </name>
            <name name-style="western">
              <surname>Madec</surname>
              <given-names>François-Xavier</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence: ready to pass the European Board examinations in urology?</article-title>
          <source>Eur Urol Open Sci</source>
          <year>2024</year>
          <month>02</month>
          <volume>60</volume>
          <fpage>44</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2666-1683(24)00211-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.euros.2024.01.002</pub-id>
          <pub-id pub-id-type="medline">38321995</pub-id>
          <pub-id pub-id-type="pii">S2666-1683(24)00211-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC10845241</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ming</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Influence of model evolution and system roles on ChatGPT's performance in Chinese medical licensing exams: comparative study</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>08</month>
          <day>13</day>
          <volume>10</volume>
          <fpage>e52784</fpage>
          <lpage>e52784</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e52784/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/52784</pub-id>
          <pub-id pub-id-type="medline">39140269</pub-id>
          <pub-id pub-id-type="pii">v10i1e52784</pub-id>
          <pub-id pub-id-type="pmcid">PMC11336778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hasan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Valdes</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chhabra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Simone</surname>
              <given-names>CB</given-names>
            </name>
          </person-group>
          <article-title>The accuracy of artificial intelligence ChatGPT in oncology examination questions</article-title>
          <source>J Am Coll Radiol</source>
          <year>2024</year>
          <month>11</month>
          <volume>21</volume>
          <issue>11</issue>
          <fpage>1800</fpage>
          <lpage>1804</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1546-1440(24)00675-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jacr.2024.07.011</pub-id>
          <pub-id pub-id-type="medline">39098369</pub-id>
          <pub-id pub-id-type="pii">S1546-1440(24)00675-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Ro</surname>
              <given-names>DH</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on solving orthopedic board-style questions: a comparative analysis of ChatGPT 3.5 and ChatGPT 4</article-title>
          <source>Clin Orthop Surg</source>
          <year>2024</year>
          <month>08</month>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>669</fpage>
          <lpage>673</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ecios.org/DOIx.php?id=10.4055/cios23179"/>
          </comment>
          <pub-id pub-id-type="doi">10.4055/cios23179</pub-id>
          <pub-id pub-id-type="medline">39092297</pub-id>
          <pub-id pub-id-type="pmcid">PMC11262944</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oura</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tatekawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Horiuchi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Matsushita</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Takita</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Atsukawa</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mitsuyama</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yoshida</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murai</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shimono</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Miki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ueda</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic accuracy of vision-language models on Japanese diagnostic radiology, nuclear medicine, and interventional radiology specialty board examinations</article-title>
          <source>Jpn J Radiol</source>
          <year>2024</year>
          <month>12</month>
          <day>20</day>
          <volume>42</volume>
          <issue>12</issue>
          <fpage>1392</fpage>
          <lpage>1398</lpage>
          <pub-id pub-id-type="doi">10.1007/s11604-024-01633-0</pub-id>
          <pub-id pub-id-type="medline">39031270</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11604-024-01633-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC11588758</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lewandowski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Łukowicz</surname>
              <given-names>Paweł</given-names>
            </name>
            <name name-style="western">
              <surname>Świetlik</surname>
              <given-names>Dariusz</given-names>
            </name>
            <name name-style="western">
              <surname>Barańska-Rybak</surname>
              <given-names>Wioletta</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT-3.5 and ChatGPT-4 dermatological knowledge level based on the Specialty Certificate Examination in Dermatology</article-title>
          <source>Clin Exp Dermatol</source>
          <year>2024</year>
          <month>06</month>
          <day>25</day>
          <volume>49</volume>
          <issue>7</issue>
          <fpage>686</fpage>
          <lpage>691</lpage>
          <pub-id pub-id-type="doi">10.1093/ced/llad255</pub-id>
          <pub-id pub-id-type="medline">37540015</pub-id>
          <pub-id pub-id-type="pii">7237242</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Knoedler</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Alfertshofer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Knoedler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hoch</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Funk</surname>
              <given-names>PF</given-names>
            </name>
            <name name-style="western">
              <surname>Cotofana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Maheta</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Brébant</surname>
              <given-names>Vanessa</given-names>
            </name>
            <name name-style="western">
              <surname>Prantl</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lamby</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Pure wisdom or Potemkin villages? A comparison of ChatGPT 3.5 and ChatGPT 4 on USMLE Step 3 style questions: quantitative analysis</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>01</month>
          <day>05</day>
          <volume>10</volume>
          <fpage>e51148</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e51148/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/51148</pub-id>
          <pub-id pub-id-type="medline">38180782</pub-id>
          <pub-id pub-id-type="pii">v10i1e51148</pub-id>
          <pub-id pub-id-type="pmcid">PMC10799278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Yunus</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sohail</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rehman</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Saeed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Sharkey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmood</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Matyal</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence for anesthesiology board-style examination questions: role of large language models</article-title>
          <source>J Cardiothorac Vasc Anesth</source>
          <year>2024</year>
          <month>05</month>
          <volume>38</volume>
          <issue>5</issue>
          <fpage>1251</fpage>
          <lpage>1259</lpage>
          <pub-id pub-id-type="doi">10.1053/j.jvca.2024.01.032</pub-id>
          <pub-id pub-id-type="medline">38423884</pub-id>
          <pub-id pub-id-type="pii">S1053-0770(24)00090-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Thongprayoon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Qureshi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Suppadungsuk</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kashani</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Miao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Craici</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Cheungpasitporn</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Personalized medicine transformed: ChatGPT's contribution to continuous renal replacement therapy alarm management in intensive care units</article-title>
          <source>J Pers Med</source>
          <year>2024</year>
          <month>02</month>
          <day>22</day>
          <volume>14</volume>
          <issue>3</issue>
          <fpage>233</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jpm14030233"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jpm14030233</pub-id>
          <pub-id pub-id-type="medline">38540976</pub-id>
          <pub-id pub-id-type="pii">jpm14030233</pub-id>
          <pub-id pub-id-type="pmcid">PMC10971480</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mayo-Yáñez</surname>
              <given-names>Miguel</given-names>
            </name>
            <name name-style="western">
              <surname>Lechien</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Maria-Saibene</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vaira</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Maniaci</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chiesa-Estomba</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Examining the performance of ChatGPT 3.5 and Microsoft Copilot in otolaryngology: a comparative study with otolaryngologists' evaluation</article-title>
          <source>Indian J Otolaryngol Head Neck Surg</source>
          <year>2024</year>
          <month>08</month>
          <day>01</day>
          <volume>76</volume>
          <issue>4</issue>
          <fpage>3465</fpage>
          <lpage>3469</lpage>
          <pub-id pub-id-type="doi">10.1007/s12070-024-04729-1</pub-id>
          <pub-id pub-id-type="medline">39130248</pub-id>
          <pub-id pub-id-type="pii">4729</pub-id>
          <pub-id pub-id-type="pmcid">PMC11306834</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rydzewski</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Dinakaran</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Ruppin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Turkbey</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Citrin</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>Comparative evaluation of LLMs in clinical oncology</article-title>
          <source>NEJM AI</source>
          <year>2024</year>
          <month>05</month>
          <day>25</day>
          <volume>1</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.1056/aioa2300151</pub-id>
          <pub-id pub-id-type="medline">39131700</pub-id>
          <pub-id pub-id-type="pmcid">PMC11315428</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Comparing ChatGPT and clinical nurses' performances on tracheostomy care: a cross-sectional study</article-title>
          <source>Int J Nurs Stud Adv</source>
          <year>2024</year>
          <month>06</month>
          <volume>6</volume>
          <fpage>100181</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2666-142X(24)00008-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijnsa.2024.100181</pub-id>
          <pub-id pub-id-type="medline">38746816</pub-id>
          <pub-id pub-id-type="pii">S2666-142X(24)00008-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC11080343</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Enhanced artificial intelligence strategies in renal oncology: iterative optimization and comparative analysis of GPT 3.5 versus 4.0</article-title>
          <source>Ann Surg Oncol</source>
          <year>2024</year>
          <month>06</month>
          <day>12</day>
          <volume>31</volume>
          <issue>6</issue>
          <fpage>3887</fpage>
          <lpage>3893</lpage>
          <pub-id pub-id-type="doi">10.1245/s10434-024-15107-0</pub-id>
          <pub-id pub-id-type="medline">38472675</pub-id>
          <pub-id pub-id-type="pii">10.1245/s10434-024-15107-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jaworski</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jasiński</surname>
              <given-names>Dawid</given-names>
            </name>
            <name name-style="western">
              <surname>Jaworski</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Hop</surname>
              <given-names>Aleksandra</given-names>
            </name>
            <name name-style="western">
              <surname>Janek</surname>
              <given-names>Artur</given-names>
            </name>
            <name name-style="western">
              <surname>Sławińska</surname>
              <given-names>Barbara</given-names>
            </name>
            <name name-style="western">
              <surname>Konieczniak</surname>
              <given-names>Lena</given-names>
            </name>
            <name name-style="western">
              <surname>Rzepka</surname>
              <given-names>Maciej</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>Maximilian</given-names>
            </name>
            <name name-style="western">
              <surname>Sysło</surname>
              <given-names>Oliwia</given-names>
            </name>
            <name name-style="western">
              <surname>Jarząbek</surname>
              <given-names>Victoria</given-names>
            </name>
            <name name-style="western">
              <surname>Błecha</surname>
              <given-names>Zuzanna</given-names>
            </name>
            <name name-style="western">
              <surname>Haraziński</surname>
              <given-names>Konrad</given-names>
            </name>
            <name name-style="western">
              <surname>Jasińska</surname>
              <given-names>Natalia</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the performance of artificial intelligence versus medical professionals in the Polish final medical examination</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>08</month>
          <volume>16</volume>
          <issue>8</issue>
          <fpage>e66011</fpage>
          <pub-id pub-id-type="doi">10.7759/cureus.66011</pub-id>
          <pub-id pub-id-type="medline">39221376</pub-id>
          <pub-id pub-id-type="pmcid">PMC11366403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bharatha</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ojeh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fazle Rabbi</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnamurthy</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Layne-Yarde</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Springer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Connell</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Majumder</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Comparing the performance of ChatGPT-4 and medical students on MCQs at varied levels of Bloom’s taxonomy</article-title>
          <source>Adv Med Educ Pract</source>
          <year>2024</year>
          <month>05</month>
          <volume>15</volume>
          <fpage>393</fpage>
          <lpage>400</lpage>
          <pub-id pub-id-type="doi">10.2147/amep.s457408</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Le</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT yields a passing score on a pediatric board preparatory exam but raises red flags</article-title>
          <source>Global Pediatric Health</source>
          <year>2024</year>
          <month>03</month>
          <day>24</day>
          <volume>11</volume>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.1177/2333794x241240327</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arango</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Flynn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zeitlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lorenzana</surname>
              <given-names>Daniel J</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>Andrew J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>Matthew S</given-names>
            </name>
            <name name-style="western">
              <surname>Strohl</surname>
              <given-names>Adam B</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>Lawrence E</given-names>
            </name>
            <name name-style="western">
              <surname>Weir</surname>
              <given-names>Tristan B</given-names>
            </name>
          </person-group>
          <article-title>The performance of ChatGPT on the American Society for Surgery of the Hand self-assessment examination</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>04</month>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>e58950</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38800302"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.58950</pub-id>
          <pub-id pub-id-type="medline">38800302</pub-id>
          <pub-id pub-id-type="pmcid">PMC11126365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rojas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rojas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Burgess</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Toro-Pérez</surname>
              <given-names>Javier</given-names>
            </name>
            <name name-style="western">
              <surname>Salehi</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Exploring the performance of ChatGPT versions 3.5, 4, and 4 with vision in the Chilean medical licensing examination: observational study</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>04</month>
          <day>29</day>
          <volume>10</volume>
          <fpage>e55048</fpage>
          <lpage>e55048</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e55048/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/55048</pub-id>
          <pub-id pub-id-type="medline">38686550</pub-id>
          <pub-id pub-id-type="pii">v10i1e55048</pub-id>
          <pub-id pub-id-type="pmcid">PMC11082432</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chau</surname>
              <given-names>RCW</given-names>
            </name>
            <name name-style="western">
              <surname>Thu</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>OY</given-names>
            </name>
            <name name-style="western">
              <surname>Hsung</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Lo</surname>
              <given-names>ECM</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>WYH</given-names>
            </name>
          </person-group>
          <article-title>Performance of generative artificial intelligence in dental licensing examinations</article-title>
          <source>Int Dent J</source>
          <year>2024</year>
          <month>06</month>
          <volume>74</volume>
          <issue>3</issue>
          <fpage>616</fpage>
          <lpage>621</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0020-6539(23)00989-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.identj.2023.12.007</pub-id>
          <pub-id pub-id-type="medline">38242810</pub-id>
          <pub-id pub-id-type="pii">S0020-6539(23)00989-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC11123518</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thirunavukarasu</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmood</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Malem</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Foster</surname>
              <given-names>WP</given-names>
            </name>
            <name name-style="western">
              <surname>Sanghera</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>YL</given-names>
            </name>
            <name name-style="western">
              <surname>Chong</surname>
              <given-names>YJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shakeel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>BKJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Rauz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSW</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSJ</given-names>
            </name>
          </person-group>
          <article-title>Large language models approach expert-level clinical knowledge and reasoning in ophthalmology: a head-to-head cross-sectional study</article-title>
          <source>PLOS Digit Health</source>
          <year>2024</year>
          <month>04</month>
          <day>17</day>
          <volume>3</volume>
          <issue>4</issue>
          <fpage>e0000341</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38630683"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pdig.0000341</pub-id>
          <pub-id pub-id-type="medline">38630683</pub-id>
          <pub-id pub-id-type="pii">PDIG-D-23-00293</pub-id>
          <pub-id pub-id-type="pmcid">PMC11023493</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bicknell</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Whalen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ricks</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Spaedy</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Skelton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Edupuganti</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dzubinski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tate</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Dyess</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lindeman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lehmann</surname>
              <given-names>LS</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT-4 Omni performance in USMLE disciplines and clinical skills: comparative analysis</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>11</month>
          <day>06</day>
          <volume>10</volume>
          <fpage>e63430</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e63430/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/63430</pub-id>
          <pub-id pub-id-type="medline">39504445</pub-id>
          <pub-id pub-id-type="pii">v10i1e63430</pub-id>
          <pub-id pub-id-type="pmcid">PMC11611793</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haddad</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Saade</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on ophthalmology-related questions across various examination levels: observational study</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>01</month>
          <day>18</day>
          <volume>10</volume>
          <fpage>e50842</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e50842/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/50842</pub-id>
          <pub-id pub-id-type="medline">38236632</pub-id>
          <pub-id pub-id-type="pii">v10i1e50842</pub-id>
          <pub-id pub-id-type="pmcid">PMC10835593</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Noda</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Izaki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kitano</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Komatsu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ichikawa</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shibagaki</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT and Bard in self-assessment questions for nephrology board renewal</article-title>
          <source>Clin Exp Nephrol</source>
          <year>2024</year>
          <month>05</month>
          <day>14</day>
          <volume>28</volume>
          <issue>5</issue>
          <fpage>465</fpage>
          <lpage>469</lpage>
          <pub-id pub-id-type="doi">10.1007/s10157-023-02451-w</pub-id>
          <pub-id pub-id-type="medline">38353783</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10157-023-02451-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yudovich</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Makarova</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hague</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Performance of GPT-3.5 and GPT-4 on standardized urology knowledge assessment items in the United States: a descriptive study</article-title>
          <source>J Educ Eval Health Prof</source>
          <year>2024</year>
          <month>07</month>
          <day>08</day>
          <volume>21</volume>
          <fpage>17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.3352/jeehp.2024.21.17"/>
          </comment>
          <pub-id pub-id-type="doi">10.3352/jeehp.2024.21.17</pub-id>
          <pub-id pub-id-type="medline">38977032</pub-id>
          <pub-id pub-id-type="pii">jeehp.2024.21.17</pub-id>
          <pub-id pub-id-type="pmcid">PMC11893186</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yeh</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Comparing the performance of ChatGPT GPT-4, Bard, and Llama-2 in the Taiwan Psychiatric Licensing Examination and in differential diagnosis with multi-center psychiatrists</article-title>
          <source>Psychiatry Clin Neurosci</source>
          <year>2024</year>
          <month>06</month>
          <day>26</day>
          <volume>78</volume>
          <issue>6</issue>
          <fpage>347</fpage>
          <lpage>352</lpage>
          <pub-id pub-id-type="doi">10.1111/pcn.13656</pub-id>
          <pub-id pub-id-type="medline">38404249</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farhat</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhry</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Nadeem</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sohail</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>DØ</given-names>
            </name>
          </person-group>
          <article-title>Evaluating large language models for the National Premedical Exam in India: comparative analysis of GPT-3.5, GPT-4, and Bard</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>02</month>
          <day>21</day>
          <volume>10</volume>
          <fpage>e51523</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e51523/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/51523</pub-id>
          <pub-id pub-id-type="medline">38381486</pub-id>
          <pub-id pub-id-type="pii">v10i1e51523</pub-id>
          <pub-id pub-id-type="pmcid">PMC10918540</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Safranek</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Socrates</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Chartash</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>How does ChatGPT perform on the United States Medical Licensing Examination (USMLE)? The implications of large language models for medical education and knowledge assessment</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>02</month>
          <day>08</day>
          <volume>9</volume>
          <fpage>e45312</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e45312/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/45312</pub-id>
          <pub-id pub-id-type="medline">36753318</pub-id>
          <pub-id pub-id-type="pii">v9i1e45312</pub-id>
          <pub-id pub-id-type="pmcid">PMC9947764</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kung</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gauthier</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Evaluating ChatGPT performance on the orthopaedic in-training examination</article-title>
          <source>JB JS Open Access</source>
          <year>2023</year>
          <volume>8</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37693092"/>
          </comment>
          <pub-id pub-id-type="doi">10.2106/JBJS.OA.23.00056</pub-id>
          <pub-id pub-id-type="medline">37693092</pub-id>
          <pub-id pub-id-type="pii">JBJSOA-D-23-00056</pub-id>
          <pub-id pub-id-type="pmcid">PMC10484364</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gencer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aydin</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Can ChatGPT pass the thoracic surgery exam?</article-title>
          <source>Am J Med Sci</source>
          <year>2023</year>
          <month>10</month>
          <volume>366</volume>
          <issue>4</issue>
          <fpage>291</fpage>
          <lpage>295</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amjms.2023.08.001</pub-id>
          <pub-id pub-id-type="medline">37549788</pub-id>
          <pub-id pub-id-type="pii">S0002-9629(23)01292-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>OY</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Zadnik Sullivan</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Fridley</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Asaad</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Cielo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oyelese</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Doberstein</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Gokaslan</surname>
              <given-names>ZL</given-names>
            </name>
            <name name-style="western">
              <surname>Telfeian</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT and GPT-4 on neurosurgery written board examinations</article-title>
          <source>Neurosurgery</source>
          <year>2023</year>
          <month>12</month>
          <day>01</day>
          <volume>93</volume>
          <issue>6</issue>
          <fpage>1353</fpage>
          <lpage>1365</lpage>
          <pub-id pub-id-type="doi">10.1227/neu.0000000000002632</pub-id>
          <pub-id pub-id-type="medline">37581444</pub-id>
          <pub-id pub-id-type="pii">00006123-202312000-00018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Massey</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Montgomery</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Comparison of ChatGPT-3.5, ChatGPT-4, and orthopaedic resident performance on orthopaedic assessment examinations</article-title>
          <source>J Am Acad Orthop Surg</source>
          <year>2023</year>
          <month>12</month>
          <day>01</day>
          <volume>31</volume>
          <issue>23</issue>
          <fpage>1173</fpage>
          <lpage>1179</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37671415"/>
          </comment>
          <pub-id pub-id-type="doi">10.5435/JAAOS-D-23-00396</pub-id>
          <pub-id pub-id-type="medline">37671415</pub-id>
          <pub-id pub-id-type="pii">00124635-990000000-00782</pub-id>
          <pub-id pub-id-type="pmcid">PMC10627532</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suchman</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Garg</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Trindade</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Chat Generative Pretrained Transformer fails the multiple-choice American College of Gastroenterology self-assessment test</article-title>
          <source>Am J Gastroenterol</source>
          <year>2023</year>
          <month>12</month>
          <day>01</day>
          <volume>118</volume>
          <issue>12</issue>
          <fpage>2280</fpage>
          <lpage>2282</lpage>
          <pub-id pub-id-type="doi">10.14309/ajg.0000000000002320</pub-id>
          <pub-id pub-id-type="medline">37212584</pub-id>
          <pub-id pub-id-type="pii">00000434-202312000-00032</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sakai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Maeda</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ozaki</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kanda</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kurimoto</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT in board examinations for specialists in the Japanese Ophthalmology Society</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>12</month>
          <volume>15</volume>
          <issue>12</issue>
          <fpage>e49903</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38174202"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.49903</pub-id>
          <pub-id pub-id-type="medline">38174202</pub-id>
          <pub-id pub-id-type="pmcid">PMC10763518</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gomaa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Semrau</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haderlein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lettmaier</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Weissmann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Grigo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tkhayat</surname>
              <given-names>HB</given-names>
            </name>
            <name name-style="western">
              <surname>Frey</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gaipl</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Distel</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Maier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fietkau</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Putz</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Benchmarking ChatGPT-4 on a radiation oncology in-training exam and Red Journal Gray Zone cases: potentials and challenges for AI-assisted medical education and decision making in radiation oncology</article-title>
          <source>Front Oncol</source>
          <year>2023</year>
          <volume>13</volume>
          <fpage>1265024</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37790756"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fonc.2023.1265024</pub-id>
          <pub-id pub-id-type="medline">37790756</pub-id>
          <pub-id pub-id-type="pmcid">PMC10543650</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yanagita</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yokokawa</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Uchida</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tawara</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ikusaka</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Accuracy of ChatGPT on medical questions in the National Medical Licensing Examination in Japan: evaluation study</article-title>
          <source>JMIR Form Res</source>
          <year>2023</year>
          <month>10</month>
          <day>13</day>
          <volume>7</volume>
          <fpage>e48023</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2023/1/e48023/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48023</pub-id>
          <pub-id pub-id-type="medline">37831496</pub-id>
          <pub-id pub-id-type="pii">v7i1e48023</pub-id>
          <pub-id pub-id-type="pmcid">PMC10612006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Teebagy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Colwell</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yaghy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Faustina</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Improved performance of ChatGPT-4 on the OKAP Examination: a comparative study with ChatGPT-3.5</article-title>
          <source>J Acad Ophthalmol (2017)</source>
          <year>2023</year>
          <month>07</month>
          <day>11</day>
          <volume>15</volume>
          <issue>2</issue>
          <fpage>e184</fpage>
          <lpage>e187</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0043-1774399"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0043-1774399</pub-id>
          <pub-id pub-id-type="medline">37701862</pub-id>
          <pub-id pub-id-type="pii">JAO-425</pub-id>
          <pub-id pub-id-type="pmcid">PMC10495224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaneda</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kaneda</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Akashima</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Okita</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Misaki</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yamashiro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ozaki</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tanimoto</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Assessing the performance of GPT-3.5 and GPT-4 on the 2023 Japanese Nursing Examination</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>08</month>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>e42924</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37667724"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.42924</pub-id>
          <pub-id pub-id-type="medline">37667724</pub-id>
          <pub-id pub-id-type="pmcid">PMC10475149</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flores-Cohaila</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>García-Vicente</surname>
              <given-names>Abigaíl</given-names>
            </name>
            <name name-style="western">
              <surname>Vizcarra-Jiménez</surname>
              <given-names>Sonia F</given-names>
            </name>
            <name name-style="western">
              <surname>De la Cruz-Galán</surname>
              <given-names>Janith P</given-names>
            </name>
            <name name-style="western">
              <surname>Gutiérrez-Arratia</surname>
              <given-names>Jesús D</given-names>
            </name>
            <name name-style="western">
              <surname>Quiroga Torres</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Taype-Rondan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on the Peruvian National Licensing Medical Examination: cross-sectional study</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>09</month>
          <day>28</day>
          <volume>9</volume>
          <fpage>e48039</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e48039/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48039</pub-id>
          <pub-id pub-id-type="medline">37768724</pub-id>
          <pub-id pub-id-type="pii">v9i1e48039</pub-id>
          <pub-id pub-id-type="pmcid">PMC10570896</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref97">
        <label>97</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fowler</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pullen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Birkett</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT and Bard on the official part 1 FRCOphth practice questions</article-title>
          <source>Br J Ophthalmol</source>
          <year>2024</year>
          <month>09</month>
          <day>20</day>
          <volume>108</volume>
          <issue>10</issue>
          <fpage>1379</fpage>
          <lpage>1383</lpage>
          <pub-id pub-id-type="doi">10.1136/bjo-2023-324091</pub-id>
          <pub-id pub-id-type="medline">37932006</pub-id>
          <pub-id pub-id-type="pii">bjo-2023-324091</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref98">
        <label>98</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moshirfar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Altaf</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Stoakes</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Tuttle</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hoopes</surname>
              <given-names>PC</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in ophthalmology: a comparative analysis of GPT-3.5, GPT-4, and human expertise in answering StatPearls questions</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>06</month>
          <volume>15</volume>
          <issue>6</issue>
          <fpage>e40822</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37485215"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.40822</pub-id>
          <pub-id pub-id-type="medline">37485215</pub-id>
          <pub-id pub-id-type="pmcid">PMC10362981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref99">
        <label>99</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vaid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Soroush</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Charney</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Comparing ChatGPT and GPT-4 performance in USMLE soft skill assessments</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <month>10</month>
          <day>01</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>16492</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-43436-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-43436-9</pub-id>
          <pub-id pub-id-type="medline">37779171</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-43436-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC10543445</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref100">
        <label>100</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Thongprayoon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia Valencia</surname>
              <given-names>OA</given-names>
            </name>
            <name name-style="western">
              <surname>Krisanapan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Mekraksakit</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Suarez</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Craici</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Cheungpasitporn</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on nephrology test questions</article-title>
          <source>Clin J Am Soc Nephrol</source>
          <year>2023</year>
          <month>10</month>
          <day>18</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>35</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.2215/cjn.0000000000000330</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref101">
        <label>101</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaneda</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Namba</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kaneda</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Tanimoto</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in childcare: assessing the performance and acceptance of ChatGPT responses</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>08</month>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>e44484</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37791148"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.44484</pub-id>
          <pub-id pub-id-type="medline">37791148</pub-id>
          <pub-id pub-id-type="pmcid">PMC10544433</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref102">
        <label>102</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Takagi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Watari</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Erabi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sakaguchi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Performance of GPT-3.5 and GPT-4 on the Japanese Medical Licensing Examination: comparison study</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>06</month>
          <day>29</day>
          <volume>9</volume>
          <fpage>e48002</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e48002/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48002</pub-id>
          <pub-id pub-id-type="medline">37384388</pub-id>
          <pub-id pub-id-type="pii">v9i1e48002</pub-id>
          <pub-id pub-id-type="pmcid">PMC10365615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref103">
        <label>103</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>OY</given-names>
            </name>
            <name name-style="western">
              <surname>Connolly</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Fridley</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Zadnik Sullivan</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Cielo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oyelese</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Doberstein</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Telfeian</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Gokaslan</surname>
              <given-names>ZL</given-names>
            </name>
            <name name-style="western">
              <surname>Asaad</surname>
              <given-names>WF</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT, GPT-4, and Google Bard on a neurosurgery oral boards preparation question bank</article-title>
          <source>Neurosurgery</source>
          <year>2023</year>
          <month>11</month>
          <day>01</day>
          <volume>93</volume>
          <issue>5</issue>
          <fpage>1090</fpage>
          <lpage>1098</lpage>
          <pub-id pub-id-type="doi">10.1227/neu.0000000000002551</pub-id>
          <pub-id pub-id-type="medline">37306460</pub-id>
          <pub-id pub-id-type="pii">00006123-990000000-00775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref104">
        <label>104</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ohta</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ohta</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The performance of GPT-3.5, GPT-4, and Bard on the Japanese National Dentist Examination: a comparison study</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>12</month>
          <volume>15</volume>
          <issue>12</issue>
          <fpage>e50369</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38213361"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.50369</pub-id>
          <pub-id pub-id-type="medline">38213361</pub-id>
          <pub-id pub-id-type="pmcid">PMC10782219</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref105">
        <label>105</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Watari</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Takagi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sakaguchi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nishizaki</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yamamoto</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tokuda</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Performance comparison of ChatGPT-4 and Japanese medical residents in the General Medicine In-Training Examination: comparison study</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>12</month>
          <day>06</day>
          <volume>9</volume>
          <fpage>e52202</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e52202/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/52202</pub-id>
          <pub-id pub-id-type="medline">38055323</pub-id>
          <pub-id pub-id-type="pii">v9i1e52202</pub-id>
          <pub-id pub-id-type="pmcid">PMC10733815</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref106">
        <label>106</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roos</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kasapovic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kaczmarczyk</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in medical education: comparative analysis of ChatGPT, Bing, and medical students in Germany</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>09</month>
          <day>04</day>
          <volume>9</volume>
          <fpage>e46482</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e46482/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/46482</pub-id>
          <pub-id pub-id-type="medline">37665620</pub-id>
          <pub-id pub-id-type="pii">v9i1e46482</pub-id>
          <pub-id pub-id-type="pmcid">PMC10507517</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref107">
        <label>107</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guillen-Grima</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Guillen-Aguinaga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guillen-Aguinaga</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Alas-Brun</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Onambele</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ortega</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Montejo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aguinaga-Ontoso</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Barach</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Aguinaga-Ontoso</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the efficacy of ChatGPT in navigating the Spanish Medical Residency Entrance Examination (MIR): promising horizons for AI in clinical medicine</article-title>
          <source>Clin Pract</source>
          <year>2023</year>
          <month>11</month>
          <day>20</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>1460</fpage>
          <lpage>1487</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=clinpract13060130"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/clinpract13060130</pub-id>
          <pub-id pub-id-type="medline">37987431</pub-id>
          <pub-id pub-id-type="pii">clinpract13060130</pub-id>
          <pub-id pub-id-type="pmcid">PMC10660543</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref108">
        <label>108</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>KJQ</given-names>
            </name>
            <name name-style="western">
              <surname>Meaney</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kemppainen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Punnett</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Leung</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Assessment of resident and AI chatbot performance on the University of Toronto family medicine residency progress test: comparative study</article-title>
          <source>JMIR Med Educ</source>
          <year>2023</year>
          <month>09</month>
          <day>19</day>
          <volume>9</volume>
          <fpage>e50514</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2023/1/e50514/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/50514</pub-id>
          <pub-id pub-id-type="medline">37725411</pub-id>
          <pub-id pub-id-type="pii">v9i1e50514</pub-id>
          <pub-id pub-id-type="pmcid">PMC10548315</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref109">
        <label>109</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schubert</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Wick</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Venkataramani</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Performance of large language models on a neurology board-style examination</article-title>
          <source>JAMA Netw Open</source>
          <year>2023</year>
          <month>12</month>
          <day>01</day>
          <volume>6</volume>
          <issue>12</issue>
          <fpage>e2346721</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38060223"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.46721</pub-id>
          <pub-id pub-id-type="medline">38060223</pub-id>
          <pub-id pub-id-type="pii">2812620</pub-id>
          <pub-id pub-id-type="pmcid">PMC10704278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref110">
        <label>110</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Torres-Zegarra</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Rios-Garcia</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ñaña-Cordova</surname>
              <given-names>Alvaro Micael</given-names>
            </name>
            <name name-style="western">
              <surname>Arteaga-Cisneros</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Chalco</surname>
              <given-names>XCB</given-names>
            </name>
            <name name-style="western">
              <surname>Ordoñez</surname>
              <given-names>Marina Atena Bustamante</given-names>
            </name>
            <name name-style="western">
              <surname>Rios</surname>
              <given-names>CJG</given-names>
            </name>
            <name name-style="western">
              <surname>Godoy</surname>
              <given-names>CAR</given-names>
            </name>
            <name name-style="western">
              <surname>Quezada</surname>
              <given-names>KLTP</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez-Arratia</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Flores-Cohaila</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT, Bard, Claude, and Bing on the Peruvian National Licensing Medical Examination: a cross-sectional study</article-title>
          <source>J Educ Eval Health Prof</source>
          <year>2023</year>
          <month>11</month>
          <day>20</day>
          <volume>20</volume>
          <fpage>30</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37981579"/>
          </comment>
          <pub-id pub-id-type="doi">10.3352/jeehp.2023.20.30</pub-id>
          <pub-id pub-id-type="medline">37981579</pub-id>
          <pub-id pub-id-type="pii">jeehp.2023.20.30</pub-id>
          <pub-id pub-id-type="pmcid">PMC11009012</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref111">
        <label>111</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kirshteyn</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Golan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chaet</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT vs. HuggingChat on OB-GYN topics</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>03</month>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>e56187</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38618446"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.56187</pub-id>
          <pub-id pub-id-type="medline">38618446</pub-id>
          <pub-id pub-id-type="pmcid">PMC11015885</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref112">
        <label>112</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Nuland</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Erdogan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Açar</surname>
              <given-names>Cenkay</given-names>
            </name>
            <name name-style="western">
              <surname>Contrucci</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hilbrants</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Maanach</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Egberts</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>van der Linden</surname>
              <given-names>PD</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on factual knowledge questions regarding clinical pharmacy</article-title>
          <source>J Clin Pharmacol</source>
          <year>2024</year>
          <month>09</month>
          <day>16</day>
          <volume>64</volume>
          <issue>9</issue>
          <fpage>1095</fpage>
          <lpage>1100</lpage>
          <pub-id pub-id-type="doi">10.1002/jcph.2443</pub-id>
          <pub-id pub-id-type="medline">38623909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref113">
        <label>113</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Danesh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pazouki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Danesh</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Danesh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vardar-Sengul</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in dental education: ChatGPT's performance on the periodontic in-service examination</article-title>
          <source>J Periodontol</source>
          <year>2024</year>
          <month>01</month>
          <day>10</day>
          <volume>95</volume>
          <issue>7</issue>
          <fpage>682</fpage>
          <lpage>687</lpage>
          <pub-id pub-id-type="doi">10.1002/jper.23-0514</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref114">
        <label>114</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Caussade</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Stockton Hogrogian</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Pediatric dermatologists versus AI bots: evaluating the medical knowledge and diagnostic capabilities of ChatGPT</article-title>
          <source>Pediatr Dermatol</source>
          <year>2024</year>
          <month>05</month>
          <day>09</day>
          <volume>41</volume>
          <issue>5</issue>
          <fpage>831</fpage>
          <lpage>834</lpage>
          <pub-id pub-id-type="doi">10.1111/pde.15649</pub-id>
          <pub-id pub-id-type="medline">38721744</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref115">
        <label>115</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fiedler</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Azua</surname>
              <given-names>EN</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT performance on the American Shoulder and Elbow Surgeons maintenance of certification exam</article-title>
          <source>J Shoulder Elbow Surg</source>
          <year>2024</year>
          <month>09</month>
          <volume>33</volume>
          <issue>9</issue>
          <fpage>1888</fpage>
          <lpage>1893</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jse.2024.02.029</pub-id>
          <pub-id pub-id-type="medline">38580067</pub-id>
          <pub-id pub-id-type="pii">S1058-2746(24)00231-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref116">
        <label>116</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coleman</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>JN</given-names>
            </name>
          </person-group>
          <article-title>Two artificial intelligence models underperform on examinations in a veterinary curriculum</article-title>
          <source>J Am Vet Med Assoc</source>
          <year>2024</year>
          <month>05</month>
          <day>01</day>
          <volume>262</volume>
          <issue>5</issue>
          <fpage>692</fpage>
          <lpage>697</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://avmajournals.avma.org/doi/10.2460/javma.23.12.0666"/>
          </comment>
          <pub-id pub-id-type="doi">10.2460/javma.23.12.0666</pub-id>
          <pub-id pub-id-type="medline">38382193</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref117">
        <label>117</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abbas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rehman</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Rehman</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Comparing the performance of popular large language models on the National Board of Medical Examiners sample questions</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>03</month>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>e55991</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38606229"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.55991</pub-id>
          <pub-id pub-id-type="medline">38606229</pub-id>
          <pub-id pub-id-type="pmcid">PMC11007479</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref118">
        <label>118</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jarou</surname>
              <given-names>ZJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dakka</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McGuire</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bunting</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT versus human performance on emergency medicine board preparation questions</article-title>
          <source>Ann Emerg Med</source>
          <year>2024</year>
          <month>01</month>
          <volume>83</volume>
          <issue>1</issue>
          <fpage>87</fpage>
          <lpage>88</lpage>
          <pub-id pub-id-type="doi">10.1016/j.annemergmed.2023.08.010</pub-id>
          <pub-id pub-id-type="medline">37725017</pub-id>
          <pub-id pub-id-type="pii">S0196-0644(23)00663-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref119">
        <label>119</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sensoy</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Citirik</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Assessing the proficiency of artificial intelligence programs in the diagnosis and treatment of cornea, conjunctiva, and eyelid diseases and exploring the advantages of each other benefits</article-title>
          <source>Cont Lens Anterior Eye</source>
          <year>2024</year>
          <month>04</month>
          <volume>47</volume>
          <issue>2</issue>
          <fpage>102125</fpage>
          <pub-id pub-id-type="doi">10.1016/j.clae.2024.102125</pub-id>
          <pub-id pub-id-type="medline">38443209</pub-id>
          <pub-id pub-id-type="pii">S1367-0484(24)00008-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref120">
        <label>120</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guerra</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Hofmann</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Fathi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mayfield</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Petrigliano</surname>
              <given-names>FA</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>JN</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT, Bard, and Bing chat are large language processing models that answered orthopaedic in-training examination questions with similar accuracy to first-year orthopaedic surgery residents</article-title>
          <source>Arthroscopy</source>
          <year>2025</year>
          <month>03</month>
          <volume>41</volume>
          <issue>3</issue>
          <fpage>557</fpage>
          <lpage>562</lpage>
          <pub-id pub-id-type="doi">10.1016/j.arthro.2024.08.023</pub-id>
          <pub-id pub-id-type="medline">39209078</pub-id>
          <pub-id pub-id-type="pii">S0749-8063(24)00621-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref121">
        <label>121</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goswami</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>Priyanka</given-names>
            </name>
          </person-group>
          <article-title>Evaluating ChatGPT-3.5 and Claude-2 in answering and explaining conceptual medical physiology multiple-choice questions</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>09</month>
          <volume>15</volume>
          <issue>9</issue>
          <fpage>e46222</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37908959"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.46222</pub-id>
          <pub-id pub-id-type="medline">37908959</pub-id>
          <pub-id pub-id-type="pmcid">PMC10613833</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref122">
        <label>122</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheong</surname>
              <given-names>KX</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fenner</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Teo</surname>
              <given-names>KY</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>YX</given-names>
            </name>
            <name name-style="western">
              <surname>Sivaprasad</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Keane</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>CMG</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>TY</given-names>
            </name>
            <name name-style="western">
              <surname>Cheong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Tham</surname>
              <given-names>YC</given-names>
            </name>
          </person-group>
          <article-title>Comparing generative and retrieval-based chatbots in answering patient questions regarding age-related macular degeneration and diabetic retinopathy</article-title>
          <source>Br J Ophthalmol</source>
          <year>2024</year>
          <month>09</month>
          <day>20</day>
          <volume>108</volume>
          <issue>10</issue>
          <fpage>1443</fpage>
          <lpage>1449</lpage>
          <pub-id pub-id-type="doi">10.1136/bjo-2023-324533</pub-id>
          <pub-id pub-id-type="medline">38749531</pub-id>
          <pub-id pub-id-type="pii">bjo-2023-324533</pub-id>
          <pub-id pub-id-type="pmcid">PMC11716104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref123">
        <label>123</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Hong</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Chun</given-names>
            </name>
            <name name-style="western">
              <surname>Ran</surname>
              <given-names>Guanghui</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Juan</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>Chengliang</given-names>
            </name>
          </person-group>
          <article-title>The performance of large language model-powered chatbots compared to oncology physicians on colorectal cancer queries</article-title>
          <source>Int J Surg</source>
          <year>2024</year>
          <month>10</month>
          <day>01</day>
          <volume>110</volume>
          <issue>10</issue>
          <fpage>6509</fpage>
          <lpage>6517</lpage>
          <pub-id pub-id-type="doi">10.1097/JS9.0000000000001850</pub-id>
          <pub-id pub-id-type="medline">38935100</pub-id>
          <pub-id pub-id-type="pii">01279778-990000000-01734</pub-id>
          <pub-id pub-id-type="pmcid">PMC11487020</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref124">
        <label>124</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kozaily</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Geagea</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Akdogan</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Atkins</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Elshazly</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Guglin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tedford</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wehbe</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Accuracy and consistency of online large language model-based artificial intelligence chat platforms in answering patients' questions about heart failure</article-title>
          <source>Int J Cardiol</source>
          <year>2024</year>
          <month>08</month>
          <day>01</day>
          <volume>408</volume>
          <fpage>132115</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijcard.2024.132115</pub-id>
          <pub-id pub-id-type="medline">38697402</pub-id>
          <pub-id pub-id-type="pii">S0167-5273(24)00737-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref125">
        <label>125</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hua</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Clinical application potential of large language model: a study based on thyroid nodules</article-title>
          <source>Endocrine</source>
          <year>2025</year>
          <month>01</month>
          <day>30</day>
          <volume>87</volume>
          <issue>1</issue>
          <fpage>206</fpage>
          <lpage>213</lpage>
          <pub-id pub-id-type="doi">10.1007/s12020-024-03981-3</pub-id>
          <pub-id pub-id-type="medline">39080210</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12020-024-03981-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref126">
        <label>126</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tessier</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Javidan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Strong</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>McKechnie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Malone</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kroh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>JT</given-names>
            </name>
            <collab>ASMBS Artificial Intelligence and Digital Surgery Task Force</collab>
          </person-group>
          <article-title>Harnessing artificial intelligence in bariatric surgery: comparative analysis of ChatGPT-4, Bing, and Bard in generating clinician-level bariatric surgery recommendations</article-title>
          <source>Surg Obes Relat Dis</source>
          <year>2024</year>
          <month>07</month>
          <volume>20</volume>
          <issue>7</issue>
          <fpage>603</fpage>
          <lpage>608</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1550-7289(24)00118-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.soard.2024.03.011</pub-id>
          <pub-id pub-id-type="medline">38644078</pub-id>
          <pub-id pub-id-type="pii">S1550-7289(24)00118-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref127">
        <label>127</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doğan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Özçakmakcı</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Yılmaz</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The performance of chatbots and the AAPOS website as a tool for amblyopia education</article-title>
          <source>J Pediatr Ophthalmol Strabismus</source>
          <year>2024</year>
          <month>04</month>
          <day>25</day>
          <volume>61</volume>
          <issue>5</issue>
          <fpage>325</fpage>
          <lpage>331</lpage>
          <pub-id pub-id-type="doi">10.3928/01913913-20240409-01</pub-id>
          <pub-id pub-id-type="medline">38661309</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref128">
        <label>128</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hossain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Radfar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Siddiqui</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gardin</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Unlocking health literacy: the ultimate guide to hypertension education from ChatGPT versus Google Gemini</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>05</month>
          <volume>16</volume>
          <issue>5</issue>
          <fpage>e59898</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38721479"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.59898</pub-id>
          <pub-id pub-id-type="medline">38721479</pub-id>
          <pub-id pub-id-type="pmcid">PMC11078260</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref129">
        <label>129</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Yoseph</surname>
              <given-names>ET</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Suarez</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fatemi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Maldaner</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Stienen</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Zygourakis</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <article-title>Analyzing large language models' responses to common lumbar spine fusion surgery questions: a comparison between ChatGPT and Bard</article-title>
          <source>Neurospine</source>
          <year>2024</year>
          <month>06</month>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>633</fpage>
          <lpage>641</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38955533"/>
          </comment>
          <pub-id pub-id-type="doi">10.14245/ns.2448098.049</pub-id>
          <pub-id pub-id-type="medline">38955533</pub-id>
          <pub-id pub-id-type="pii">ns.2448098.049</pub-id>
          <pub-id pub-id-type="pmcid">PMC11224745</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref130">
        <label>130</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iannantuono</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bracken-Clarke</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Karzai</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Choo-Wosoba</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gulley</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Floudas</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Comparison of large language models in answering immuno-oncology questions: a cross-sectional study</article-title>
          <source>Oncologist</source>
          <year>2024</year>
          <month>05</month>
          <day>03</day>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>407</fpage>
          <lpage>414</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38309720"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/oncolo/oyae009</pub-id>
          <pub-id pub-id-type="medline">38309720</pub-id>
          <pub-id pub-id-type="pii">7600405</pub-id>
          <pub-id pub-id-type="pmcid">PMC11067804</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref131">
        <label>131</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anguita</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Downie</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ferro Desideri</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sagoo</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Assessing large language models' accuracy in providing patient support for choroidal melanoma</article-title>
          <source>Eye (Lond)</source>
          <year>2024</year>
          <month>11</month>
          <day>13</day>
          <volume>38</volume>
          <issue>16</issue>
          <fpage>3113</fpage>
          <lpage>3117</lpage>
          <pub-id pub-id-type="doi">10.1038/s41433-024-03231-w</pub-id>
          <pub-id pub-id-type="medline">39003430</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41433-024-03231-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC11544095</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref132">
        <label>132</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yeung</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hua</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Performance of large language models on benign prostatic hyperplasia frequently asked questions</article-title>
          <source>Prostate</source>
          <year>2024</year>
          <month>06</month>
          <volume>84</volume>
          <issue>9</issue>
          <fpage>807</fpage>
          <lpage>813</lpage>
          <pub-id pub-id-type="doi">10.1002/pros.24699</pub-id>
          <pub-id pub-id-type="medline">38558009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref133">
        <label>133</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bracken-Clarke</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Iannantuono</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Choo-Wosoba</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gulley</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Floudas</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <article-title>Utility of large language models for health care professionals and patients in navigating hematopoietic stem cell transplantation: comparison of the performance of ChatGPT-3.5, ChatGPT-4, and Bard</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>05</month>
          <day>17</day>
          <volume>26</volume>
          <fpage>e54758</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024/1/e54758/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/54758</pub-id>
          <pub-id pub-id-type="medline">38758582</pub-id>
          <pub-id pub-id-type="pii">v26i1e54758</pub-id>
          <pub-id pub-id-type="pmcid">PMC11143389</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref134">
        <label>134</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Ghaziani</surname>
              <given-names>TT</given-names>
            </name>
            <name name-style="western">
              <surname>Kwo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tse</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kesselman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kamaya</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tse</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Large language models' responses to liver cancer surveillance, diagnosis, and management questions: accuracy, reliability, readability</article-title>
          <source>Abdom Radiol (NY)</source>
          <year>2024</year>
          <month>12</month>
          <day>01</day>
          <volume>49</volume>
          <issue>12</issue>
          <fpage>4286</fpage>
          <lpage>4294</lpage>
          <pub-id pub-id-type="doi">10.1007/s00261-024-04501-7</pub-id>
          <pub-id pub-id-type="medline">39088019</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00261-024-04501-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref135">
        <label>135</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Monroe</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelhafez</surname>
              <given-names>YG</given-names>
            </name>
            <name name-style="western">
              <surname>Atsina</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Aman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nardo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Madani</surname>
              <given-names>MH</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of responses to cardiac imaging questions by the artificial intelligence large language model ChatGPT</article-title>
          <source>Clin Imaging</source>
          <year>2024</year>
          <month>08</month>
          <volume>112</volume>
          <fpage>110193</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0899-7071(24)00123-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.clinimag.2024.110193</pub-id>
          <pub-id pub-id-type="medline">38820977</pub-id>
          <pub-id pub-id-type="pii">S0899-7071(24)00123-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref136">
        <label>136</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chervonski</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Harish</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Rockman</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Sadek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Teter</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobowitz</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Berland</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Lohr</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Maldonado</surname>
              <given-names>TS</given-names>
            </name>
          </person-group>
          <article-title>Generative artificial intelligence chatbots may provide appropriate informational responses to common vascular surgery questions by patients</article-title>
          <source>Vascular</source>
          <year>2025</year>
          <month>02</month>
          <day>18</day>
          <volume>33</volume>
          <issue>1</issue>
          <fpage>229</fpage>
          <lpage>237</lpage>
          <pub-id pub-id-type="doi">10.1177/17085381241240550</pub-id>
          <pub-id pub-id-type="medline">38500300</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref137">
        <label>137</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kassab</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hadi El Hajjar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wardrop</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Brateanu</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Accuracy of online artificial intelligence models in primary care settings</article-title>
          <source>Am J Prev Med</source>
          <year>2024</year>
          <month>06</month>
          <volume>66</volume>
          <issue>6</issue>
          <fpage>1054</fpage>
          <lpage>1059</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amepre.2024.02.006</pub-id>
          <pub-id pub-id-type="medline">38354991</pub-id>
          <pub-id pub-id-type="pii">S0749-3797(24)00060-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref138">
        <label>138</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al-Sharif</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Penteado</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dib El Jalbout</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Topilow</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shoji</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Kikkawa</surname>
              <given-names>DO</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Korn</surname>
              <given-names>BS</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the accuracy of ChatGPT and Google BARD in fielding oculoplastic patient queries: a comparative study on artificial versus human intelligence</article-title>
          <source>Ophthalmic Plast Reconstr Surg</source>
          <year>2024</year>
          <volume>40</volume>
          <issue>3</issue>
          <fpage>303</fpage>
          <lpage>311</lpage>
          <pub-id pub-id-type="doi">10.1097/IOP.0000000000002567</pub-id>
          <pub-id pub-id-type="medline">38215452</pub-id>
          <pub-id pub-id-type="pii">00002341-202405000-00010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref139">
        <label>139</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mejia</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Arroyave</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Saturno</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ndjonko</surname>
              <given-names>LCM</given-names>
            </name>
            <name name-style="western">
              <surname>Zaidat</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Rajjoub</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zapolsky</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>Use of ChatGPT for determining clinical and surgical treatment of lumbar disc herniation with radiculopathy: a North American Spine Society guideline comparison</article-title>
          <source>Neurospine</source>
          <year>2024</year>
          <month>03</month>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>149</fpage>
          <lpage>158</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38291746"/>
          </comment>
          <pub-id pub-id-type="doi">10.14245/ns.2347052.526</pub-id>
          <pub-id pub-id-type="medline">38291746</pub-id>
          <pub-id pub-id-type="pii">ns.2347052.526</pub-id>
          <pub-id pub-id-type="pmcid">PMC10992643</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref140">
        <label>140</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Radfar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dayal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Khrais</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluating ChatGPT-3.5 and ChatGPT-4.0 responses on hyperlipidemia for patient education</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>05</month>
          <volume>16</volume>
          <issue>5</issue>
          <fpage>e61067</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38803402"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.61067</pub-id>
          <pub-id pub-id-type="medline">38803402</pub-id>
          <pub-id pub-id-type="pmcid">PMC11128363</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref141">
        <label>141</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Coelho</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Guedes</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Cattoni</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Carvalho</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Duarte-Batista</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT 3.5 and 4 as a tool for patient support before and after DBS surgery for Parkinson's disease</article-title>
          <source>Neurol Sci</source>
          <year>2024</year>
          <month>12</month>
          <day>29</day>
          <volume>45</volume>
          <issue>12</issue>
          <fpage>5757</fpage>
          <lpage>5764</lpage>
          <pub-id pub-id-type="doi">10.1007/s10072-024-07732-0</pub-id>
          <pub-id pub-id-type="medline">39198356</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10072-024-07732-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC11554841</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref142">
        <label>142</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>ZW</given-names>
            </name>
            <name name-style="western">
              <surname>Pushpanathan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yew</surname>
              <given-names>SME</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>JSH</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>DZ</given-names>
            </name>
            <name name-style="western">
              <surname>Goh</surname>
              <given-names>JHL</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>MCJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Koh</surname>
              <given-names>VTC</given-names>
            </name>
            <name name-style="western">
              <surname>Tham</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Benchmarking large language models' performances for myopia care: a comparative analysis of ChatGPT-3.5, ChatGPT-4.0, and Google Bard</article-title>
          <source>EBioMedicine</source>
          <year>2023</year>
          <month>09</month>
          <volume>95</volume>
          <fpage>104770</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2352-3964(23)00336-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ebiom.2023.104770</pub-id>
          <pub-id pub-id-type="medline">37625267</pub-id>
          <pub-id pub-id-type="pii">S2352-3964(23)00336-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC10470220</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref143">
        <label>143</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahsepar</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Tavakoli</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>GHJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hassani</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Abtin</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bedayat</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>How AI responds to common lung cancer questions: ChatGPT vs Google Bard</article-title>
          <source>Radiology</source>
          <year>2023</year>
          <month>06</month>
          <volume>307</volume>
          <issue>5</issue>
          <fpage>e230922</fpage>
          <pub-id pub-id-type="doi">10.1148/radiol.230922</pub-id>
          <pub-id pub-id-type="medline">37310252</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref144">
        <label>144</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pushpanathan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>ZW</given-names>
            </name>
            <name name-style="western">
              <surname>Er Yew</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>DZ</given-names>
            </name>
            <name name-style="western">
              <surname>Hui'En Lin</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Lin Goh</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Jin Tan</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Chang Koh</surname>
              <given-names>VT</given-names>
            </name>
            <name name-style="western">
              <surname>Tham</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Popular large language model chatbots' accuracy, comprehensiveness, and self-awareness in answering ocular symptom queries</article-title>
          <source>iScience</source>
          <year>2023</year>
          <month>11</month>
          <day>17</day>
          <volume>26</volume>
          <issue>11</issue>
          <fpage>108163</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-0042(23)02240-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.isci.2023.108163</pub-id>
          <pub-id pub-id-type="medline">37915603</pub-id>
          <pub-id pub-id-type="pii">S2589-0042(23)02240-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC10616302</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref145">
        <label>145</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coskun</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Yagiz</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ocakoglu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dalkilic</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Pehlivan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Assessing the accuracy and completeness of artificial intelligence language models in providing information on methotrexate use</article-title>
          <source>Rheumatol Int</source>
          <year>2024</year>
          <month>03</month>
          <day>25</day>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>509</fpage>
          <lpage>515</lpage>
          <pub-id pub-id-type="doi">10.1007/s00296-023-05473-5</pub-id>
          <pub-id pub-id-type="medline">37747564</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00296-023-05473-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref146">
        <label>146</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>King</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Samaan</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Yeo</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kunkel</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Habib</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Ghashghaei</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A multidisciplinary assessment of ChatGPT's knowledge of amyloidosis: observational study</article-title>
          <source>JMIR Cardio</source>
          <year>2024</year>
          <month>04</month>
          <day>19</day>
          <volume>8</volume>
          <fpage>e53421</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cardio.jmir.org/2024/1/e53421/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/53421</pub-id>
          <pub-id pub-id-type="medline">38640472</pub-id>
          <pub-id pub-id-type="pii">v8i1e53421</pub-id>
          <pub-id pub-id-type="pmcid">PMC11069089</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref147">
        <label>147</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pinto</surname>
              <given-names>VBP</given-names>
            </name>
            <name name-style="western">
              <surname>de Azevedo</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Wroclawski</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Gentile</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Jesus</surname>
              <given-names>VLM</given-names>
            </name>
            <name name-style="western">
              <surname>de Bessa Junior</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nahas</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Sacomani</surname>
              <given-names>CAR</given-names>
            </name>
            <name name-style="western">
              <surname>Sandhu</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Gomes</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Conformity of ChatGPT recommendations with the AUA/SUFU guideline on postprostatectomy urinary incontinence</article-title>
          <source>Neurourol Urodyn</source>
          <year>2024</year>
          <month>04</month>
          <day>07</day>
          <volume>43</volume>
          <issue>4</issue>
          <fpage>935</fpage>
          <lpage>941</lpage>
          <pub-id pub-id-type="doi">10.1002/nau.25442</pub-id>
          <pub-id pub-id-type="medline">38451040</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref148">
        <label>148</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Momenaei</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wakabayashi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shahlaee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Durrani</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Pandit</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mansour</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Abishek</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sridhar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yonekawa</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kuriyan</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Assessing ChatGPT-3.5 versus ChatGPT-4 performance in surgical treatment of retinal diseases: a comparative study</article-title>
          <source>Ophthalmic Surg Lasers Imaging Retina</source>
          <year>2024</year>
          <month>08</month>
          <volume>55</volume>
          <issue>8</issue>
          <fpage>481</fpage>
          <lpage>482</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.healio.com/doi/abs/10.3928/23258160-20240227-02?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.3928/23258160-20240227-02</pub-id>
          <pub-id pub-id-type="medline">38531015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref149">
        <label>149</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stevenson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hibberd</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Can artificial intelligence replace biochemists? A study comparing interpretation of thyroid function test results by ChatGPT and Google Bard to practising biochemists</article-title>
          <source>Ann Clin Biochem</source>
          <year>2024</year>
          <month>03</month>
          <day>20</day>
          <volume>61</volume>
          <issue>2</issue>
          <fpage>143</fpage>
          <lpage>149</lpage>
          <pub-id pub-id-type="doi">10.1177/00045632231203473</pub-id>
          <pub-id pub-id-type="medline">37699796</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref150">
        <label>150</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dronkers</surname>
              <given-names>EAC</given-names>
            </name>
            <name name-style="western">
              <surname>Geneid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Al Yaghchi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lechien</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the potential of AI chatbots in treatment decision-making for acquired bilateral vocal fold paralysis in adults</article-title>
          <source>J Voice</source>
          <year>2024</year>
          <month>04</month>
          <day>06</day>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0892-1997(24)00059-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jvoice.2024.02.020</pub-id>
          <pub-id pub-id-type="medline">38584026</pub-id>
          <pub-id pub-id-type="pii">S0892-1997(24)00059-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref151">
        <label>151</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahimli Ocakoglu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Coskun</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The emerging role of AI in patient education: a comparative analysis of LLM accuracy for pelvic organ prolapse</article-title>
          <source>Med Princ Pract</source>
          <year>2024</year>
          <month>03</month>
          <day>25</day>
          <volume>33</volume>
          <issue>4</issue>
          <fpage>330</fpage>
          <lpage>337</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1159/000538538"/>
          </comment>
          <pub-id pub-id-type="doi">10.1159/000538538</pub-id>
          <pub-id pub-id-type="medline">38527444</pub-id>
          <pub-id pub-id-type="pii">000538538</pub-id>
          <pub-id pub-id-type="pmcid">PMC11324208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref152">
        <label>152</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gandhi</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Joesph</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Rajagopal</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Aparnavi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Katkuri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dayama</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Satapathy</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Khatib</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Gaidhane</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zahiruddin</surname>
              <given-names>QS</given-names>
            </name>
            <name name-style="western">
              <surname>Behera</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on the India undergraduate community medicine examination: cross-sectional study</article-title>
          <source>JMIR Form Res</source>
          <year>2024</year>
          <month>03</month>
          <day>25</day>
          <volume>8</volume>
          <fpage>e49964</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2024/1/e49964/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/49964</pub-id>
          <pub-id pub-id-type="medline">38526538</pub-id>
          <pub-id pub-id-type="pii">v8i1e49964</pub-id>
          <pub-id pub-id-type="pmcid">PMC11002731</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref153">
        <label>153</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tariq</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Malik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khanna</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Evolving landscape of large language models: an evaluation of ChatGPT and Bard in answering patient queries on colonoscopy</article-title>
          <source>Gastroenterology</source>
          <year>2024</year>
          <month>01</month>
          <volume>166</volume>
          <issue>1</issue>
          <fpage>220</fpage>
          <lpage>221</lpage>
          <pub-id pub-id-type="doi">10.1053/j.gastro.2023.08.033</pub-id>
          <pub-id pub-id-type="medline">37634736</pub-id>
          <pub-id pub-id-type="pii">S0016-5085(23)04916-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref154">
        <label>154</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tham</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>TY</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Potential multidisciplinary use of large language models for addressing queries in cardio-oncology</article-title>
          <source>J Am Heart Assoc</source>
          <year>2024</year>
          <month>03</month>
          <day>19</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>e033584</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ahajournals.org/doi/abs/10.1161/JAHA.123.033584?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1161/JAHA.123.033584</pub-id>
          <pub-id pub-id-type="medline">38497458</pub-id>
          <pub-id pub-id-type="pmcid">PMC11010006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref155">
        <label>155</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sosa</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Cung</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Suhardi</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Morse</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Thomson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Iyer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Greenblatt</surname>
              <given-names>MB</given-names>
            </name>
          </person-group>
          <article-title>Capacity for large language model chatbots to aid in orthopedic management, research, and patient queries</article-title>
          <source>J Orthop Res</source>
          <year>2024</year>
          <month>06</month>
          <day>21</day>
          <volume>42</volume>
          <issue>6</issue>
          <fpage>1276</fpage>
          <lpage>1282</lpage>
          <pub-id pub-id-type="doi">10.1002/jor.25782</pub-id>
          <pub-id pub-id-type="medline">38245845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref156">
        <label>156</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>NB</given-names>
            </name>
            <name name-style="western">
              <surname>Dickson</surname>
              <given-names>DW</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the performance of large language models: ChatGPT and Google Bard in generating differential diagnoses in clinicopathological conferences of neurodegenerative disorders</article-title>
          <source>Brain Pathol</source>
          <year>2024</year>
          <month>05</month>
          <day>08</day>
          <volume>34</volume>
          <issue>3</issue>
          <fpage>e13207</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37553205"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/bpa.13207</pub-id>
          <pub-id pub-id-type="medline">37553205</pub-id>
          <pub-id pub-id-type="pmcid">PMC11006994</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref157">
        <label>157</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Warrier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Haleem</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zaki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Eloy</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>The comparative diagnostic capability of large language models in otolaryngology</article-title>
          <source>Laryngoscope</source>
          <year>2024</year>
          <month>09</month>
          <day>02</day>
          <volume>134</volume>
          <issue>9</issue>
          <fpage>3997</fpage>
          <lpage>4002</lpage>
          <pub-id pub-id-type="doi">10.1002/lary.31434</pub-id>
          <pub-id pub-id-type="medline">38563415</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref158">
        <label>158</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Sivan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bachir</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sarwar</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Ruzicka</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>O'Malley</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Lobo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>IC</given-names>
            </name>
            <name name-style="western">
              <surname>Cassimatis</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Hundal</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>NV</given-names>
            </name>
          </person-group>
          <article-title>Can artificial intelligence mitigate missed diagnoses by generating differential diagnoses for neurosurgeons?</article-title>
          <source>World Neurosurg</source>
          <year>2024</year>
          <month>07</month>
          <volume>187</volume>
          <fpage>e1083</fpage>
          <lpage>e1088</lpage>
          <pub-id pub-id-type="doi">10.1016/j.wneu.2024.05.052</pub-id>
          <pub-id pub-id-type="medline">38759788</pub-id>
          <pub-id pub-id-type="pii">S1878-8750(24)00814-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref159">
        <label>159</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirosawa</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Harada</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mizuta</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sakamoto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tokumasu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic performance of generative artificial intelligences for a series of complex case reports</article-title>
          <source>Digit Health</source>
          <year>2024</year>
          <month>07</month>
          <day>21</day>
          <volume>10</volume>
          <fpage>20552076241265215</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/20552076241265215?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20552076241265215</pub-id>
          <pub-id pub-id-type="medline">39229463</pub-id>
          <pub-id pub-id-type="pii">10.1177_20552076241265215</pub-id>
          <pub-id pub-id-type="pmcid">PMC11369864</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref160">
        <label>160</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mandalos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tsouris</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Artificial versus human intelligence in the diagnostic approach of ophthalmic case scenarios: a qualitative evaluation of performance and consistency</article-title>
          <source>Cureus</source>
          <year>2024</year>
          <month>06</month>
          <volume>16</volume>
          <issue>6</issue>
          <fpage>e62471</fpage>
          <pub-id pub-id-type="doi">10.7759/cureus.62471</pub-id>
          <pub-id pub-id-type="medline">39015855</pub-id>
          <pub-id pub-id-type="pmcid">PMC11251728</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref161">
        <label>161</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krusche</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Callhoff</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Knitza</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ruffer</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic accuracy of a large language model in rheumatology: comparison of physician and ChatGPT-4</article-title>
          <source>Rheumatol Int</source>
          <year>2024</year>
          <month>02</month>
          <day>24</day>
          <volume>44</volume>
          <issue>2</issue>
          <fpage>303</fpage>
          <lpage>306</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37742280"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00296-023-05464-6</pub-id>
          <pub-id pub-id-type="medline">37742280</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00296-023-05464-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC10796566</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref162">
        <label>162</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Delsoz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madadi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Raja</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Munir</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Tamm</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mehravaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Soleimani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Djalilian</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yousefi</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT in diagnosis of corneal eye diseases</article-title>
          <source>Cornea</source>
          <year>2024</year>
          <month>05</month>
          <day>01</day>
          <volume>43</volume>
          <issue>5</issue>
          <fpage>664</fpage>
          <lpage>670</lpage>
          <pub-id pub-id-type="doi">10.1097/ICO.0000000000003492</pub-id>
          <pub-id pub-id-type="medline">38391243</pub-id>
          <pub-id pub-id-type="pii">00003226-202405000-00019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref163">
        <label>163</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kozel</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gurses</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Gecici</surname>
              <given-names>NN</given-names>
            </name>
            <name name-style="western">
              <surname>Gökalp</surname>
              <given-names>Elif</given-names>
            </name>
            <name name-style="western">
              <surname>Bahadir</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Merenzon</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Komotar</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ivan</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Chat-GPT on brain tumors: an examination of artificial intelligence/machine learning's ability to provide diagnoses and treatment plans for example neuro-oncology cases</article-title>
          <source>Clin Neurol Neurosurg</source>
          <year>2024</year>
          <month>04</month>
          <volume>239</volume>
          <fpage>108238</fpage>
          <pub-id pub-id-type="doi">10.1016/j.clineuro.2024.108238</pub-id>
          <pub-id pub-id-type="medline">38507989</pub-id>
          <pub-id pub-id-type="pii">S0303-8467(24)00125-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref164">
        <label>164</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stoneham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Livesey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT versus clinician: challenging the diagnostic capabilities of artificial intelligence in dermatology</article-title>
          <source>Clin Exp Dermatol</source>
          <year>2024</year>
          <month>06</month>
          <day>25</day>
          <volume>49</volume>
          <issue>7</issue>
          <fpage>707</fpage>
          <lpage>710</lpage>
          <pub-id pub-id-type="doi">10.1093/ced/llad402</pub-id>
          <pub-id pub-id-type="medline">37979201</pub-id>
          <pub-id pub-id-type="pii">7429032</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref165">
        <label>165</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Albaladejo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lorleac'h</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Allain</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>[The spring of artificial intelligence: AI vs. expert for internal medicine cases]</article-title>
          <source>Rev Med Interne</source>
          <year>2024</year>
          <month>07</month>
          <volume>45</volume>
          <issue>7</issue>
          <fpage>409</fpage>
          <lpage>414</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0248-8663(24)00032-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.revmed.2024.01.012</pub-id>
          <pub-id pub-id-type="medline">38331591</pub-id>
          <pub-id pub-id-type="pii">S0248-8663(24)00032-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref166">
        <label>166</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zandi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fahey</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Drakopoulos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bryan</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bryar</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bidwell</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Bowen</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Lavine</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Mirza</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>Exploring diagnostic precision and triage proficiency: a comparative study of GPT-4 and Bard in addressing common ophthalmic complaints</article-title>
          <source>Bioengineering (Basel)</source>
          <year>2024</year>
          <month>01</month>
          <day>26</day>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>120</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=bioengineering11020120"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/bioengineering11020120</pub-id>
          <pub-id pub-id-type="medline">38391606</pub-id>
          <pub-id pub-id-type="pii">bioengineering11020120</pub-id>
          <pub-id pub-id-type="pmcid">PMC10886029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref167">
        <label>167</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirosawa</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kawamura</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Harada</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mizuta</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tokumasu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kaji</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Suzuki</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT-generated differential diagnosis lists for complex case-derived clinical vignettes: diagnostic accuracy evaluation</article-title>
          <source>JMIR Med Inform</source>
          <year>2023</year>
          <month>10</month>
          <day>09</day>
          <volume>11</volume>
          <fpage>e48808</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2023/1/e48808/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48808</pub-id>
          <pub-id pub-id-type="medline">37812468</pub-id>
          <pub-id pub-id-type="pii">v11i1e48808</pub-id>
          <pub-id pub-id-type="pmcid">PMC10594139</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref168">
        <label>168</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirosawa</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Harada</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yokose</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sakamoto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kawamura</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic accuracy of differential-diagnosis lists generated by Generative Pretrained Transformer 3 Chatbot for clinical vignettes with common chief complaints: a pilot study</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2023</year>
          <month>02</month>
          <day>15</day>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>3378</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph20043378"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph20043378</pub-id>
          <pub-id pub-id-type="medline">36834073</pub-id>
          <pub-id pub-id-type="pii">ijerph20043378</pub-id>
          <pub-id pub-id-type="pmcid">PMC9967747</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref169">
        <label>169</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fraser</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Crossland</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bacher</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ranney</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hilliard</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Comparison of diagnostic and triage accuracy of Ada Health and WebMD symptom checkers, ChatGPT, and Physicians for Patients in an emergency department: clinical data analysis study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2023</year>
          <month>10</month>
          <day>03</day>
          <volume>11</volume>
          <fpage>e49995</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2023/1/e49995/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/49995</pub-id>
          <pub-id pub-id-type="medline">37788063</pub-id>
          <pub-id pub-id-type="pii">v11i1e49995</pub-id>
          <pub-id pub-id-type="pmcid">PMC10582809</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref170">
        <label>170</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rojas-Carabali</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Cifuentes-González</surname>
              <given-names>Carlos</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Putera</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thng</surname>
              <given-names>ZX</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Elze</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sobrin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kempen</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Biswas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>QD</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>de-la-Torre</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the diagnostic accuracy and management recommendations of ChatGPT in uveitis</article-title>
          <source>Ocul Immunol Inflamm</source>
          <year>2024</year>
          <month>10</month>
          <day>18</day>
          <volume>32</volume>
          <issue>8</issue>
          <fpage>1526</fpage>
          <lpage>1531</lpage>
          <pub-id pub-id-type="doi">10.1080/09273948.2023.2253471</pub-id>
          <pub-id pub-id-type="medline">37722842</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref171">
        <label>171</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gräf</surname>
              <given-names>Markus</given-names>
            </name>
            <name name-style="western">
              <surname>Knitza</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Leipe</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Krusche</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Welcker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mucke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hueber</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hornig</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Klemm</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kleinert</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aries</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vuillerme</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kleyer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schett</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Callhoff</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Comparison of physician and artificial intelligence-based symptom checker diagnostic accuracy</article-title>
          <source>Rheumatol Int</source>
          <year>2022</year>
          <month>12</month>
          <volume>42</volume>
          <issue>12</issue>
          <fpage>2167</fpage>
          <lpage>2176</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36087130"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00296-022-05202-4</pub-id>
          <pub-id pub-id-type="medline">36087130</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00296-022-05202-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC9548469</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref172">
        <label>172</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Unadkat</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Toscano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kashanian</surname>
              <given-names>Alon</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>Daniel G</given-names>
            </name>
            <name name-style="western">
              <surname>Horn</surname>
              <given-names>Alexander C</given-names>
            </name>
            <name name-style="western">
              <surname>D'Amico</surname>
              <given-names>Randy S</given-names>
            </name>
            <name name-style="western">
              <surname>Mittler</surname>
              <given-names>Mark</given-names>
            </name>
            <name name-style="western">
              <surname>Baum</surname>
              <given-names>Griffin R</given-names>
            </name>
          </person-group>
          <article-title>A quantitative assessment of ChatGPT as a neurosurgical triaging tool</article-title>
          <source>Neurosurgery</source>
          <year>2024</year>
          <month>08</month>
          <day>01</day>
          <volume>95</volume>
          <issue>2</issue>
          <fpage>487</fpage>
          <lpage>495</lpage>
          <pub-id pub-id-type="doi">10.1227/neu.0000000000002867</pub-id>
          <pub-id pub-id-type="medline">38353523</pub-id>
          <pub-id pub-id-type="pii">00006123-990000000-01055</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref173">
        <label>173</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirosawa</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mizuta</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Harada</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Comparative evaluation of diagnostic accuracy between Google Bard and physicians</article-title>
          <source>Am J Med</source>
          <year>2023</year>
          <month>11</month>
          <volume>136</volume>
          <issue>11</issue>
          <fpage>1119</fpage>
          <lpage>1123.e18</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amjmed.2023.08.003</pub-id>
          <pub-id pub-id-type="medline">37643659</pub-id>
          <pub-id pub-id-type="pii">S0002-9343(23)00536-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref174">
        <label>174</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lyons</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Arepalli</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Fromal</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence chatbot performance in triage of ophthalmic conditions</article-title>
          <source>Can J Ophthalmol</source>
          <year>2024</year>
          <month>08</month>
          <volume>59</volume>
          <issue>4</issue>
          <fpage>e301</fpage>
          <lpage>e308</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jcjo.2023.07.016</pub-id>
          <pub-id pub-id-type="medline">37572695</pub-id>
          <pub-id pub-id-type="pii">S0008-4182(23)00234-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref175">
        <label>175</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Makhoul</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Melkane</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Khoury</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Hadi</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Matar</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>A cross-sectional comparative study: ChatGPT 3.5 versus diverse levels of medical experts in the diagnosis of ENT diseases</article-title>
          <source>Eur Arch Otorhinolaryngol</source>
          <year>2024</year>
          <month>05</month>
          <day>16</day>
          <volume>281</volume>
          <issue>5</issue>
          <fpage>2717</fpage>
          <lpage>2721</lpage>
          <pub-id pub-id-type="doi">10.1007/s00405-024-08509-z</pub-id>
          <pub-id pub-id-type="medline">38365990</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00405-024-08509-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref176">
        <label>176</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shemer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Altarescu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Atar-Vardi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hecht</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Dubinsky-Pertzov</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Shoshany</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zmujack</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Or</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Einan-Lifshitz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pras</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic capabilities of ChatGPT in ophthalmology</article-title>
          <source>Graefes Arch Clin Exp Ophthalmol</source>
          <year>2024</year>
          <month>07</month>
          <day>06</day>
          <volume>262</volume>
          <issue>7</issue>
          <fpage>2345</fpage>
          <lpage>2352</lpage>
          <pub-id pub-id-type="doi">10.1007/s00417-023-06363-z</pub-id>
          <pub-id pub-id-type="medline">38183467</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00417-023-06363-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref177">
        <label>177</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gunes</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cesur</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The diagnostic performance of large language models and general radiologists in thoracic radiology cases: a comparative study</article-title>
          <source>J Thorac Imaging</source>
          <year>2024</year>
          <month>09</month>
          <day>13</day>
          <fpage>2024</fpage>
          <pub-id pub-id-type="doi">10.1097/RTI.0000000000000805</pub-id>
          <pub-id pub-id-type="medline">39269227</pub-id>
          <pub-id pub-id-type="pii">00005382-990000000-00153</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref178">
        <label>178</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sarangi</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Irodi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Panda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nayak</surname>
              <given-names>DSK</given-names>
            </name>
            <name name-style="western">
              <surname>Mondal</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Radiological differential diagnoses based on cardiovascular and thoracic imaging patterns: perspectives of four large language models</article-title>
          <source>Indian J Radiol Imaging</source>
          <year>2024</year>
          <month>04</month>
          <day>28</day>
          <volume>34</volume>
          <issue>2</issue>
          <fpage>269</fpage>
          <lpage>275</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0043-1777289"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0043-1777289</pub-id>
          <pub-id pub-id-type="medline">38549881</pub-id>
          <pub-id pub-id-type="pii">IJRI-23-9-2923</pub-id>
          <pub-id pub-id-type="pmcid">PMC10972667</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref179">
        <label>179</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>HT</given-names>
            </name>
            <name name-style="western">
              <surname>van Bakel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>van de Wouw</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jie</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Schipper</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>Rory D</given-names>
            </name>
            <name name-style="western">
              <surname>van Ginneken</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kurstjens</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT and generating a differential diagnosis early in an emergency department presentation</article-title>
          <source>Ann Emerg Med</source>
          <year>2024</year>
          <month>01</month>
          <volume>83</volume>
          <issue>1</issue>
          <fpage>83</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.1016/j.annemergmed.2023.08.003</pub-id>
          <pub-id pub-id-type="medline">37690022</pub-id>
          <pub-id pub-id-type="pii">S0196-0644(23)00642-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref180">
        <label>180</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haider</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Pressman</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Borna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez-Cabello</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Sehgal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Leibovich</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Forte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Evaluating large language model (LLM) performance on established breast classification systems</article-title>
          <source>Diagnostics (Basel)</source>
          <year>2024</year>
          <month>07</month>
          <day>11</day>
          <volume>14</volume>
          <issue>14</issue>
          <fpage>1491</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=diagnostics14141491"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/diagnostics14141491</pub-id>
          <pub-id pub-id-type="medline">39061628</pub-id>
          <pub-id pub-id-type="pii">diagnostics14141491</pub-id>
          <pub-id pub-id-type="pmcid">PMC11275570</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref181">
        <label>181</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gan</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Ogbodo</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Wee</surname>
              <given-names>YZ</given-names>
            </name>
            <name name-style="western">
              <surname>Gan</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>González</surname>
              <given-names>Pedro Arcos</given-names>
            </name>
          </person-group>
          <article-title>Performance of Google Bard and ChatGPT in mass casualty incidents triage</article-title>
          <source>Am J Emerg Med</source>
          <year>2024</year>
          <month>01</month>
          <volume>75</volume>
          <fpage>72</fpage>
          <lpage>78</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0735-6757(23)00576-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ajem.2023.10.034</pub-id>
          <pub-id pub-id-type="medline">37967485</pub-id>
          <pub-id pub-id-type="pii">S0735-6757(23)00576-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref182">
        <label>182</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aiumtrakul</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Thongprayoon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Arayangkool</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vo</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Wannaphut</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Suppadungsuk</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Krisanapan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia Valencia</surname>
              <given-names>OA</given-names>
            </name>
            <name name-style="western">
              <surname>Qureshi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Miao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cheungpasitporn</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Personalized medicine in urolithiasis: AI chatbot-assisted dietary management of oxalate for kidney stone prevention</article-title>
          <source>J Pers Med</source>
          <year>2024</year>
          <month>01</month>
          <day>18</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>107</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jpm14010107"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jpm14010107</pub-id>
          <pub-id pub-id-type="medline">38248809</pub-id>
          <pub-id pub-id-type="pii">jpm14010107</pub-id>
          <pub-id pub-id-type="pmcid">PMC10817681</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref183">
        <label>183</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dantona</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hull</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>DRG-LLaMA: tuning LLaMA model to predict diagnosis-related group for hospitalized patients</article-title>
          <source>NPJ Digit Med</source>
          <year>2024</year>
          <month>01</month>
          <day>22</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>16</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00989-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00989-3</pub-id>
          <pub-id pub-id-type="medline">38253711</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00989-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC10803802</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref184">
        <label>184</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Azizi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mahdavi</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Scales</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tanwani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cole-Lewis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pfohl</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Payne</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Seneviratne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gamble</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kelly</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Babiker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schärli</surname>
              <given-names>Nathanael</given-names>
            </name>
            <name name-style="western">
              <surname>Chowdhery</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mansfield</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Agüera y Arcas</surname>
              <given-names>Blaise</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Matias</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gottweis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tomasev</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barral</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Semturs</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Karthikesalingam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Large language models encode clinical knowledge</article-title>
          <source>Nature</source>
          <year>2023</year>
          <month>08</month>
          <volume>620</volume>
          <issue>7972</issue>
          <fpage>172</fpage>
          <lpage>180</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37438534"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-023-06291-2</pub-id>
          <pub-id pub-id-type="medline">37438534</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-023-06291-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10396962</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref185">
        <label>185</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thirunavukarasu</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSJ</given-names>
            </name>
            <name name-style="western">
              <surname>Elangovan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSW</given-names>
            </name>
          </person-group>
          <article-title>Large language models in medicine</article-title>
          <source>Nat Med</source>
          <year>2023</year>
          <month>08</month>
          <day>17</day>
          <volume>29</volume>
          <issue>8</issue>
          <fpage>1930</fpage>
          <lpage>1940</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-023-02448-8</pub-id>
          <pub-id pub-id-type="medline">37460753</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-023-02448-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref186">
        <label>186</label>
        <nlm-citation citation-type="web">
          <article-title>Researcher Access Program application</article-title>
          <source>OpenAI</source>
          <access-date>2025-04-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://platform.openai.com/docs/model-index-for-researchers">https://platform.openai.com/docs/model-index-for-researchers</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref187">
        <label>187</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Afvari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Pre-trained multimodal large language model enhances dermatological diagnosis using SkinGPT-4</article-title>
          <source>Nat Commun</source>
          <year>2024</year>
          <month>07</month>
          <day>05</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>5649</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41467-024-50043-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-024-50043-3</pub-id>
          <pub-id pub-id-type="medline">38969632</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-024-50043-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC11226626</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref188">
        <label>188</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>ChatDoctor: a medical chat model fine-tuned on a large language model meta-AI (LLaMA) using medical domain knowledge</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <month>06</month>
          <volume>15</volume>
          <issue>6</issue>
          <fpage>e40895</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37492832"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.40895</pub-id>
          <pub-id pub-id-type="medline">37492832</pub-id>
          <pub-id pub-id-type="pmcid">PMC10364849</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref189">
        <label>189</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bagde</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Dhopte</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alam</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Basri</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A systematic review and meta-analysis on ChatGPT and its utilization in medical and dental research</article-title>
          <source>Heliyon</source>
          <year>2023</year>
          <month>12</month>
          <volume>9</volume>
          <issue>12</issue>
          <fpage>e23050</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2405-8440(23)10258-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.heliyon.2023.e23050</pub-id>
          <pub-id pub-id-type="medline">38144348</pub-id>
          <pub-id pub-id-type="pii">S2405-8440(23)10258-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC10746423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref190">
        <label>190</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levin</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Horesh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Brezinov</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT in medical examinations: a systematic review and a meta-analysis</article-title>
          <source>BJOG</source>
          <year>2024</year>
          <month>02</month>
          <volume>131</volume>
          <issue>3</issue>
          <fpage>378</fpage>
          <lpage>380</lpage>
          <pub-id pub-id-type="doi">10.1111/1471-0528.17641</pub-id>
          <pub-id pub-id-type="medline">37604703</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
