<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="letter" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e67409</article-id>
      <article-id pub-id-type="pmid">39642373</article-id>
      <article-id pub-id-type="doi">10.2196/67409</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Research Letter</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Research Letter</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>The Triage and Diagnostic Accuracy of Frontier Large Language Models: Updated Comparison to Physician Performance</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Williams</surname>
            <given-names>Christopher</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Shi</surname>
            <given-names>Qiming</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Sorich</surname>
            <given-names>Michael Joseph</given-names>
          </name>
          <degrees>BPharm, GradDipMedStat, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>College of Medicine and Public Health</institution>
            <institution>Flinders University</institution>
            <addr-line>GPO Box 2100</addr-line>
            <addr-line>Adelaide, 5001</addr-line>
            <country>Australia</country>
            <phone>61 82013217</phone>
            <email>michael.sorich@flinders.edu.au</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1999-866X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Mangoni</surname>
            <given-names>Arduino Aleksander</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8699-1412</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Bacchi</surname>
            <given-names>Stephen</given-names>
          </name>
          <degrees>MBBS, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5130-8628</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Menz</surname>
            <given-names>Bradley Douglas</given-names>
          </name>
          <degrees>BPharm</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0855-5081</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Hopkins</surname>
            <given-names>Ashley Mark</given-names>
          </name>
          <degrees>BPharm, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7652-4378</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>College of Medicine and Public Health</institution>
        <institution>Flinders University</institution>
        <addr-line>Adelaide</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Clinical Pharmacology</institution>
        <institution>Southern Adelaide Local Health Network</institution>
        <addr-line>Adelaide</addr-line>
        <country>Australia</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Neurology and the Center for Genomic Medicine</institution>
        <institution>Massachusetts General Hospital and Harvard Medical School</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Michael Joseph Sorich <email>michael.sorich@flinders.edu.au</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>6</day>
        <month>12</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e67409</elocation-id>
      <history>
        <date date-type="received">
          <day>10</day>
          <month>10</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>4</day>
          <month>11</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>11</day>
          <month>11</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>13</day>
          <month>11</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Michael Joseph Sorich, Arduino Aleksander Mangoni, Stephen Bacchi, Bradley Douglas Menz, Ashley Mark Hopkins. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 06.12.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e67409" xlink:type="simple"/>
      <kwd-group>
        <kwd>generative artificial intelligence</kwd>
        <kwd>large language models</kwd>
        <kwd>triage</kwd>
        <kwd>diagnosis</kwd>
        <kwd>accuracy</kwd>
        <kwd>physician</kwd>
        <kwd>ChatGPT</kwd>
        <kwd>diagnostic</kwd>
        <kwd>primary care</kwd>
        <kwd>physicians</kwd>
        <kwd>prediction</kwd>
        <kwd>medical care</kwd>
        <kwd>internet</kwd>
        <kwd>LLMs</kwd>
        <kwd>AI</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The medical capabilities of large language models (LLMs) are progressing rapidly [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. Benchmarking LLMs against human performance with clinically relevant tasks enables tracking current capabilities and progress. The triage (level/urgency of care to seek) and diagnostic accuracy of the GPT-3 model were recently compared with 5000 lay individuals using the internet and 21 practicing primary care physicians [<xref ref-type="bibr" rid="ref4">4</xref>]. The triage ability of GPT-3 was significantly inferior to that of physicians, having similar accuracy to lay individuals. The diagnostic ability was close to but below that of physicians [<xref ref-type="bibr" rid="ref4">4</xref>]. It is uncertain whether more recent frontier LLMs are still inferior to physicians on this benchmark.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>The 48 case vignettes—including both common and severe conditions—validated by Levine and colleagues [<xref ref-type="bibr" rid="ref4">4</xref>] were evaluated using three LLMs that are typically highly ranked across diverse benchmarks: GPT-4o-2024-05-13 (OpenAI), Claude-3.5-Sonnet (Anthropic), and Gemini-1.5-Pro-001 (Google) via a Python application programming interface. The LLMs were instructed to identify potential diagnoses and provide step-by-step reasoning. Subsequently, they reflected on the reasoning and selected the top three diagnoses in order of likelihood. For triage prediction, the LLM was supplied with the vignette and the three diagnoses it predicted. It was instructed to identify the urgency of the required medical care, including its step-by-step reasoning.</p>
        <p>A multi-agent workflow involving collaboration between the three distinct LLMs was also evaluated (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Each LLM was provided with its initial analysis (decision plus reasoning) and the analyses of the two other LLMs. Each LLM was instructed to reflect on all analyses and update its proposed diagnoses/triage as appropriate. The consensus decision (majority vote) was identified by an independent frontier LLM (Llama-3.1-405B; Meta) to avoid preferencing the output of a specific LLM.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Large language model (LLM) collaboration: a triage/diagnosis workflow involving initial analysis (the LLM’s initial decision and step-by-step reasoning), updated analysis (reflecting on all LLM initial analyses and updating decision if appropriate), and consensus decision (majority vote of the individual LLM’s updated decisions).</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e67409_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Diagnostic accuracy was evaluated by whether the correct diagnosis was one of the three proposed by the LLM (top 3) [<xref ref-type="bibr" rid="ref4">4</xref>]. Additionally, the accuracy of the first-ranked diagnosis (top 1) was assessed. Triage was assessed as urgent (emergency department or seeing a doctor within a day) versus nonurgent (seeing a doctor within a week or self-care) [<xref ref-type="bibr" rid="ref4">4</xref>]. The prompts and LLM settings are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study involved a secondary analysis of publicly available synthetic case vignettes. No data on human participants were used. The research was undertaken with approval from the Flinders University Human Research Ethics Committee (project ID 7800).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>The correct diagnosis was among the top three proposed diagnoses for 98.6% (142/144; frontier LLMs) and 100% (48/48; LLM collaboration) of cases. Individually, the performance of GTP-4o, Claude-3.5-Sonnet, and Gemini-1.5-Pro was 98% (47/48), 100% (48/48), and 98% (47/48), respectively.</p>
      <p>The most likely diagnosis prediction was correct for 86.8% (125/144; frontier LLMs) and 98% (47/48; LLM collaboration) of cases. Individually, the performance of GTP-4o, Claude-3.5-Sonnet, and Gemini-1.5-Pro was 94% (45/48), 96% (46/48), and 71% (34/48), respectively.</p>
      <p>Triage was correct for 92.4% (133/144; frontier LLMs) and 92% (44/48; LLM collaboration) of cases. The most common error was overestimating the urgency. Individually, the performance of GTP-4o, Claude-3.5-Sonnet, and Gemini-1.5-Pro was 92% (44/48), 94% (45/48), and 92% (44/48), respectively.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>Contemporary frontier LLMs have substantially improved performance compared to GPT-3 for diagnosis (top three: 142/144, 98.6% vs 42/48, 88%; top one: 125/144, 86.8% vs 31/48, 65%) and triage (133/144, 92.4% vs 34/48, 71%) [<xref ref-type="bibr" rid="ref4">4</xref>], highlighting the rapid progress in generative artificial intelligence performance. For diagnosis of these clinical vignettes, frontier LLMs performed similarly to physicians (top three: 142/144, 98.6% vs 637/666, 95.6%) [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>In triaging these clinical vignettes, frontier LLMs (133/144, 92.4%) now perform substantially better than lay individuals (3706/5000, 74.1%) who could use the internet (before the availability of LLMs) and similarly to primary care physicians (608/666, 91.3%) [<xref ref-type="bibr" rid="ref4">4</xref>]. This capability is consistent with recent evaluations of modern LLMs for emergency department triage [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. A limitation of this study is the relatively small sample size of cases evaluated. Given the encouraging performance of contemporary LLMs for triage assessment, future studies should assess whether LLMs allow lay individuals to make better triage decisions regarding the urgency of care they require.</p>
      <p>The rapid progress in LLM capabilities poses challenges for tracking their current capability for health-related tasks. This includes challenges for traditional peer-reviewed publications, which can become outdated by the time of publication.</p>
      <p>Additionally, we show that newer techniques involving collaboration between multiple distinct LLMs may improve diagnostic performance. However, this comes at the cost of adding operational complexity. Other methods, such as fine-tuning and in-context learning (eg, integrating search functionality and demonstrations of how to work through complex cases), offer opportunities to improve the performance of LLMs [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>].</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Settings and prompts used for large language models.</p>
        <media xlink:href="jmir_v26i1e67409_app1.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>MJS is supported by a Beat Cancer Research Fellowship from the Cancer Council South Australia. AMH holds an Emerging Leader Investigator Fellowship from the National Health and Medical Research Council, Australia (APP2008119). The PhD scholarship of BDM is supported by the National Health and Medical Research Council, Australia (APP2030913). The funders had no role in the design and conduct of the study; collection, management, analysis, and interpretation of the data; preparation, review, or approval of the manuscript; and decision to submit the manuscript for publication.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The case vignettes used are publicly available [<xref ref-type="bibr" rid="ref4">4</xref>]. The prompts used are available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>MJS reported receiving grants from Pfizer, AstraZeneca, Boehringer Ingelheim, and the National Health and Medical Research Council of Australia outside the submitted work. AMH reported receiving grants from Boehringer Ingelheim, Hospital Research Foundation, Tour De Cure, and Flinders Foundation outside the submitted work. No other disclosures were reported.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nori</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YT</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carignan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Edgar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fusi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Can generalist foundation models outcompete special-purpose tuning? Case study in medicine</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on November 28, 2023</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2311.16452</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saab</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Tanno</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stutz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wulczyn</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Capabilities of Gemini models in medicine</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on April 29, 2024</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2404.18416</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sorich</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Menz</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Quality and safety of artificial intelligence generated health information</article-title>
          <source>BMJ</source>
          <year>2024</year>
          <month>03</month>
          <day>20</day>
          <volume>384</volume>
          <fpage>q596</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.q596</pub-id>
          <pub-id pub-id-type="medline">38508683</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Tuwani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kompa</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Varma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Mehrotra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Beam</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The diagnostic and triage accuracy of the GPT-3 artificial intelligence model: an observational study</article-title>
          <source>Lancet Digit Health</source>
          <year>2024</year>
          <month>08</month>
          <volume>6</volume>
          <issue>8</issue>
          <fpage>e555</fpage>
          <lpage>e561</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-7500(24)00097-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2589-7500(24)00097-9</pub-id>
          <pub-id pub-id-type="medline">39059888</pub-id>
          <pub-id pub-id-type="pii">S2589-7500(24)00097-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>CYK</given-names>
            </name>
            <name name-style="western">
              <surname>Zack</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Miao</surname>
              <given-names>BY</given-names>
            </name>
            <name name-style="western">
              <surname>Sushil</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kornblith</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Use of a large language model to assess clinical acuity of adults in the emergency department</article-title>
          <source>JAMA Netw Open</source>
          <year>2024</year>
          <month>05</month>
          <day>01</day>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>e248895</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38713466"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2024.8895</pub-id>
          <pub-id pub-id-type="medline">38713466</pub-id>
          <pub-id pub-id-type="pii">2818387</pub-id>
          <pub-id pub-id-type="pmcid">PMC11077390</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Masanneck</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Seifert</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kölsche</surname>
              <given-names>Tristan</given-names>
            </name>
            <name name-style="western">
              <surname>Huntemann</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mehsin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bernhard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meuth</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Böhm</surname>
              <given-names>Lennert</given-names>
            </name>
            <name name-style="western">
              <surname>Pawlitzki</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Triage performance across large language models, ChatGPT, and untrained doctors in emergency medicine: comparative study</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>06</month>
          <day>14</day>
          <volume>26</volume>
          <fpage>e53297</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024//e53297/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/53297</pub-id>
          <pub-id pub-id-type="medline">38875696</pub-id>
          <pub-id pub-id-type="pii">v26i1e53297</pub-id>
          <pub-id pub-id-type="pmcid">PMC11214027</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
