<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v28i1e73326</article-id>
      <article-id pub-id-type="pmid">41554120</article-id>
      <article-id pub-id-type="doi">10.2196/73326</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Evaluating and Validating Large Language Models for Health Education on Developmental Dysplasia of the Hip: 2-Phase Study With Expert Ratings and a Pilot Randomized Controlled Trial</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Sarvestan</surname>
            <given-names>Javad</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhang</surname>
            <given-names>Jun</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>de Alencar</surname>
            <given-names>Geisa Guimaraes</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Ouyang</surname>
            <given-names>Hui</given-names>
          </name>
          <degrees>MSN</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-1692-2391</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>Gan</given-names>
          </name>
          <degrees>MSN</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-9034-5345</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Yiyuan</given-names>
          </name>
          <degrees>MSN</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-4903-2448</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Yao</surname>
            <given-names>Zhixin</given-names>
          </name>
          <degrees>MSN</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0000-6289-2452</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Yating</given-names>
          </name>
          <degrees>MSN</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-3800-7346</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Yan</surname>
            <given-names>Han</given-names>
          </name>
          <degrees>BSN</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-1257-6130</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Qin</surname>
            <given-names>Fang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-0037-0102</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Yao</surname>
            <given-names>Jinghui</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4335-7232</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Yun</given-names>
          </name>
          <degrees>MM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution/>
            <institution>Third Affiliated Hospital of Southern Medical University</institution>
            <addr-line>183 Zhongshan Road West</addr-line>
            <addr-line>Tianhe District</addr-line>
            <addr-line>Guangzhou, 510630</addr-line>
            <country>China</country>
            <phone>86 13724869220</phone>
            <email>chenyun88@smu.edu.cn</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-0169-3618</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Third Affiliated Hospital of Southern Medical University</institution>
        <addr-line>Guangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>School of Nursing</institution>
        <institution>Southern Medical University</institution>
        <addr-line>Guangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Pediatric Orthopedics</institution>
        <institution>Center for Orthopaedic Surgery</institution>
        <institution>Third Affiliated Hospital of Southern Medical University</institution>
        <addr-line>Guangzhou</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yun Chen <email>chenyun88@smu.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>19</day>
        <month>1</month>
        <year>2026</year>
      </pub-date>
      <volume>28</volume>
      <elocation-id>e73326</elocation-id>
      <history>
        <date date-type="received">
          <day>29</day>
          <month>7</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>29</day>
          <month>9</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>19</day>
          <month>12</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Hui Ouyang, Gan Lin, Yiyuan Li, Zhixin Yao, Yating Li, Han Yan, Fang Qin, Jinghui Yao, Yun Chen. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 19.01.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2026/1/e73326" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Developmental dysplasia of the hip (DDH) is a common pediatric orthopedic disease, and health education is vital to disease management and rehabilitation. The emergence of large language models (LLMs) has provided new opportunities for health education. However, the effectiveness and applicability of LLMs in DDH education have not been systematically evaluated.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study conducted an integrated 2-phase evaluation to assess the quality and educational effectiveness of LLM-generated educational materials.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This study comprised 2 phases. In phase 1, a 16-item DDH question bank was created based on Bloom’s taxonomy through literature analysis and collaboration. Four LLMs (ChatGPT-4 [OpenAI], DeepSeek-V3, Gemini 2.0 Flash [Google], and Copilot [Microsoft Corp]) were questioned using standardized prompts. All responses were independently evaluated by 5 pediatric orthopedic experts using 5-point Likert measures of accuracy, fluency, and richness, the scales of Patient Education Materials Assessment Tool for Printable Materials, and DISCERN. Readability was measured using the Flesch-Kincaid Reading Ease, Flesch-Kincaid Grade Level, and Simple Measure of Gobbledygook formulas. The data were examined using Kruskal-Wallis tests, ANOVA, and post hoc comparisons. In phase 2, an assessor-blinded, 2-arm pilot randomized controlled trial was conducted. A total of 127 caregivers were randomized into an LLM-assisted education group or a web search control group. The intervention included structured LLM training, supervised practice, and 2 weeks of reinforcement training. The outcomes, measured at baseline, postintervention, and 2-week follow-up, were eHealth literacy (primary), DDH knowledge, health risk perception, perceived usefulness, information self-efficacy, and health information-seeking behavior. Cohen <italic>d</italic> effect sizes and linear mixed-effects models were used following the intention-to-treat principle.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>There were significant differences between the 4 LLMs concerning accuracy, richness, fluency, Patient Education Materials Assessment Tool for Printable Materials Understandability, and DISCERN (<italic>P</italic>&lt;.05). ChatGPT-4 (median 63.67, IQR 63.67-64.67) and DeepSeek-V3 (median 63.67, IQR 63.33-64.67) generated more accurate text than Copilot (median 59.00, IQR 58.67-59.67). DeepSeek-V3 (median 64.00, IQR 64.00-64.00) produced richer language than Copilot (median 52.33, IQR 51.33-52.67). Gemini 2.0 Flash (median 72.67, IQR 72.33-73.00) was more fluent than Copilot (median 65.67, IQR 63.33-65.67). In phase 2, the intervention group showed higher eHealth literacy at T1 (33.62, 95% CI 32.76-34.49; <italic>d</italic>=0.20, 95% CI 0.13-0.56) and T2 (33.27, 95% CI 32.38-34.17; <italic>d</italic>=0.36, 95% CI 0.01-0.80), greater DDH knowledge at T1 (7.87, 95% CI 7.48-8.25; <italic>d</italic>=0.71, 95% CI 0.33-1.11) and T2 (7.12, 95% CI 6.72-7.51; <italic>d</italic>=0.54, 95% CI 0.17-0.96), and slight improvements in health risk perception and perceived usefulness.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Mainstream LLMs demonstrate varying capacities in generating educational content for DDH. They generated DDH caregiver education materials that were associated with modest improvements in eHealth literacy and knowledge. Although LLMs can address general informational needs, they cannot completely substitute clinical evaluation. Future research should focus on optimizing plain language, refining dialogue design, and enhancing audience personalization to improve the quality of LLMs’ materials.</p>
        </sec>
        <sec sec-type="Trial Registration">
          <title>Trial Registration</title>
          <p>Chinese Clinical Trial Registry ChiCTR2500108410; https://www.chictr.org.cn/showproj.html?proj=271987</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>large language models</kwd>
        <kwd>developmental dysplasia of the hip</kwd>
        <kwd>health education</kwd>
        <kwd>content generation</kwd>
        <kwd>mobile phone</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Developmental dysplasia of the hip (DDH) is a common pediatric orthopedic condition affecting 1%-3% of infants, with a higher prevalence in girls and more frequent involvement of the left hip [<xref ref-type="bibr" rid="ref1">1</xref>]. If undiagnosed or untreated early, DDH can lead to gait abnormalities, chronic pain, and early osteoarthritis, substantially affecting the quality of life [<xref ref-type="bibr" rid="ref2">2</xref>]. Early diagnosis and health education are critical for improving prognosis. Delayed diagnosis and treatment often require complex surgery, which not only increases the difficulty of treatment but may also result in further functional deterioration [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Traditional educational methods are limited by time and resources, making it difficult to meet patients’ diverse informational needs. The emergence of artificial intelligence (AI) has provided new opportunities for health education.</p>
        <p>In the broader field of digital health communication, AI-based conversational systems are increasingly being explored as tools to provide convenient and efficient services to meet people’s diverse needs. Currently, large language models (LLMs), such as ChatGPT, Google Gemini, Microsoft Copilot, and DeepSeek, are applied in health communication, including disease diagnosis [<xref ref-type="bibr" rid="ref5">5</xref>], treatment recommendation [<xref ref-type="bibr" rid="ref6">6</xref>], health education [<xref ref-type="bibr" rid="ref7">7</xref>], and clinical decision-making [<xref ref-type="bibr" rid="ref8">8</xref>]. For example, ChatGPT enables interactive discussions that tailor standardized medical information to individual patient needs, helping bridge communication gaps between clinicians and patients [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Although AI has demonstrated great potential in medical education, its use in patient-facing communication raises concerns. LLMs may provide erroneous medical advice [<xref ref-type="bibr" rid="ref11">11</xref>], propagate outdated medical views [<xref ref-type="bibr" rid="ref12">12</xref>], or fabricate nonexistent medical cases to generate “hallucinations” [<xref ref-type="bibr" rid="ref13">13</xref>]. At the ethical and regulatory levels, challenges arise from the model’s “black box” decision-making, including unclear accountability, difficulties in defining legal responsibility, privacy breaches, and lagging regulatory frameworks. These issues directly jeopardize users’ safety, potentially leading to misdiagnosis, delayed treatment, and other forms of direct harm. Furthermore, most generated content maintains a university reading level, which may pose comprehension challenges for users without higher education [<xref ref-type="bibr" rid="ref14">14</xref>]. These risks underscore the need for systematic evaluation before integrating such tools into health education.</p>
        <p>While prior studies have primarily examined the accuracy or readability of LLM-generated content [<xref ref-type="bibr" rid="ref15">15</xref>], few have connected content quality with its actual educational impact on end users. The extent to which LLM-generated materials can effectively support caregivers’ understanding and health literacy in specific conditions, such as DDH, remains unexplored. In DDH, caregivers have to not only comprehend specialized medical concepts but also actively recognize abnormal signs in children and make timely decisions [<xref ref-type="bibr" rid="ref16">16</xref>]. Due to the professional complexity of orthopedic knowledge and the unique nature of pediatric disorders, basic health literacy abilities are necessary for caregivers. Therefore, the different levels of digital literacy among caregivers may make it more difficult for them to properly understand information produced by LLMs. To address this, the present study systematically evaluated multiple mainstream LLMs through expert assessment and a pilot randomized controlled trial (RCT) among caregivers. By integrating expert evaluation with caregiver validation, this study extends current research on AI in health communication from theoretical assessment to empirical verification.</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>Therefore, this study aimed to provide a comprehensive evaluation and verification of LLM-generated education materials for DDH. The first phase assessed the educational quality of the outputs generated by 4 mainstream LLMs (ChatGPT-4, DeepSeek-V3, Gemini 2.0 Flash, and Copilot) through expert ratings of accuracy, understandability, actionability, and readability. The second phase involved a pilot RCT among caregivers to evaluate the actual educational impact of these materials, including digital literacy, DDH knowledge acquisition, health risk perception, information self-efficacy, perceived usefulness, and health information-seeking behaviors. This study bridged the gap by integrating the quality assessment of LLMs with an RCT to validate their content reliability and educational impact. It offered evidence for the safe and effective use of LLMs in clinical education.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Theoretical Framework</title>
        <p>The taxonomy by Bloom et al [<xref ref-type="bibr" rid="ref17">17</xref>] served as the guiding pedagogical framework for designing the educational content. The taxonomy, which is widely used to structure learning objectives and instructional materials, organizes cognitive processes into 6 hierarchical levels: remember, understand, apply, analyze, evaluate, and create. As users often need to acquire not only basic factual knowledge but also practical decision-making skills, this hierarchical model provided a structured approach for determining which levels of cognition should be targeted in education [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
        <p>Guided by this framework, we developed a 16-item question bank that intentionally spanned different cognitive levels, ranging from foundational knowledge such as definitions and symptoms to more complex tasks such as interpreting clinical scenarios or making care decisions (<xref ref-type="table" rid="table1">Table 1</xref>). This ensured that the LLM-generated responses covered the breadth of learning needs relevant to caregivers. Bloom’s taxonomy, therefore, supported the construction of a comprehensive and pedagogically meaningful learning set, helping align the generated content with education requirements.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Question bank framework based on Bloom’s taxonomy.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="270"/>
            <col width="0"/>
            <col width="700"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Bloom’s taxonomy and part</td>
                <td>Content</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Remembering</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Basics</td>
                <td colspan="2">“What is [disease name]? Please explain its main features and potential effects in simple language.”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Anatomy and effects</td>
                <td colspan="2">“Who is most likely to develop [disease name]? How common is it?”</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Understanding</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Etiology and risk factors</td>
                <td colspan="2">“Will [disease name] have a long-term impact on my quality of life? What aspects should I pay special attention to?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Symptoms and early recognition</td>
                <td colspan="2">“What parts of the body does [disease name] mainly affect? What do these parts do in a healthy state?”</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Applying</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physician examination and diagnosis</td>
                <td colspan="2">“What symptoms or consequences may arise if these parts are damaged? Can you provide specific examples?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Emergencies</td>
                <td colspan="2">“What are the main causes of [disease name]? What risk factors may increase the chances of developing it?”</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Analyzing</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hospital treatment and rehabilitation</td>
                <td colspan="2">“What lifestyle habits or environmental factors increase the risk of developing [disease name]? How can I prevent it?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medication management</td>
                <td colspan="2">“If I have a family history, is my risk of developing [disease name] higher? What preventive measures should I take?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pain management</td>
                <td colspan="2">“What are the main symptoms of [disease name]? What signs indicate the disease is worsening? Should I seek immediate medical attention?”</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Evaluating</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Postoperative management</td>
                <td colspan="2">“What methods do doctors usually use to confirm the diagnosis of [disease name]? What is the purpose of each test?”</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Creating</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Daily living and health management</td>
                <td colspan="2">“What indicators are most important in test results? How do these results reflect the severity of the disease?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Mental health</td>
                <td colspan="2">“After confirming the diagnosis of [disease name], do I need to schedule regular follow-ups? How often should I have them and what should be checked?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Digital tools and management</td>
                <td colspan="2">“What symptoms indicate that I need to seek immediate medical attention?”</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Expanding<sup>a</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Education and support resources</td>
                <td colspan="2">“How should I handle and self-monitor during an emergency situation?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Social and economic impact</td>
                <td colspan="2">“What treatments will I receive during hospitalization? What is the purpose of each treatment?”</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Future planning and visioning</td>
                <td colspan="2">“How can I prevent infections or other complications during hospitalization? What can family members do to assist with recovery?”</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Not part of Bloom’s taxonomy; it is an extension of this study.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Study Design</title>
        <p>The evaluation study had 2 phases. Phase 1 was a cross-sectional study in which physicians evaluated the answers provided by the LLMs. Phase 2 was a 2-arm pilot RCT comparing health education using LLMs with web-based searches.</p>
      </sec>
      <sec>
        <title>Phase 1: Expert Evaluation Study</title>
        <sec>
          <title>Model Testing</title>
          <p>Based on Bloom’s taxonomy, we collected and categorized common questions regarding DDH. We also reviewed clinical guidelines [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref23">23</xref>] to identify the key areas of knowledge. Using this information, an initial question bank was developed, which was subsequently refined and finalized through expert review. Each question was guided by a harmonized prompt paragraph: “Using developmental dysplasia of the hip (DDH) in children as an example, answer the following questions in detail, ensuring the content is easily understandable for non-medical professionals. Life-like examples and situations can be incorporated to help readers better grasp the information. Please reduce the number of syllables to make the sentence simpler.” All the generated texts and the complete question bank are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Each model generated educational materials based on the 16-item question bank, and the experiment was repeated 3 times for a total of 192 generations (4 models × 16 questions × 3 repetitions). Data were collected from January to February 2025. ChatGPT-4, DeepSeek-V3, Gemini 2.0 Flash, and Copilot were evaluated; no experimental, beta, or preview releases were included. The experiments were performed under the default settings of the web interfaces without modifying the generation parameters. To ensure reproducibility and independence of the outputs, each prompt was regenerated 3 times by establishing a new session for each run with the same original prompt. All outputs, including identical or similar responses, were retained to reflect the intrinsic variability of the models.</p>
        </sec>
        <sec>
          <title>Assessment of Quality and Readability</title>
          <p>Quality assessment tools as primary outcomes included (1) a Likert scale for assessing 3 items (accuracy, fluency, and richness of the material), scoring 16 questions on a scale from 1 to 5, with higher scores indicating better performance; (2) the DISCERN tool [<xref ref-type="bibr" rid="ref24">24</xref>], which assessed the overall quality of the educational material, with a total of 16 items, scored on a scale from 1 to 5, with higher scores indicating better quality; and (3) the Patient Education Materials Assessment Tool for Printable Materials (PEMAT-P) [<xref ref-type="bibr" rid="ref25">25</xref>], which contains 17 items measuring understandability and 7 items assessing actionability. These were reduced to 10 and 4 items, respectively, to accommodate the textual output, with a 70% passing threshold based on the guidelines. During the evaluation process, each material was independently scored by 5 evaluators. The scores from evaluators were retained for subsequent data analysis.</p>
          <p>Readability assessment tools as secondary outcomes included (1) the Flesch-Kincaid Reading Ease (FKRE), (2) the Flesch-Kincaid Grade Level (FKGL), and (3) the Simple Measure of Gobbledygook (SMOG) index, chosen for their widespread use and reliability in assessing text readability. All 3 score calculations involved the total number of words, sentences, and syllables. The FKRE measured the simplicity of the text, with scores ranging from 0 to 100 and higher scores indicating better readability. The FKGL represented the reading grade level; lower FKGL and SMOG scores indicated easier comprehension, and higher scores indicated more complex language. An FKRE score above 60 or a grade level below sixth grade was the recommended reading level for the general public. Readability scores were calculated using a web-based readability calculator (Readable; Added Bytes). The detailed formulas are provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        </sec>
        <sec>
          <title>Expert Evaluation</title>
          <p>The material generated by the LLMs was independently assessed for quality by 5 pediatric orthopedic physicians with expertise in DDH, selected through rigorous predefined criteria: (1) ≥10 years of clinical experience in DDH diagnosis or treatment and (2) completion of standardized training on the assessment rubric before this study, using the DDH guidelines as the gold standard [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. To ensure blinding, the LLM outputs were made anonymous by an independent researcher who replaced the model names with random codes. The evaluators confirmed that they could not infer the identities of the LLMs or determine if repeated outputs came from the same model. Interrater reliability was assessed for each outcome dimension using the intraclass correlation coefficient (ICC). ICC values were interpreted as follows: &lt;0.5=poor, 0.5-0.75=moderate, 0.75-0.9=good, and &gt;0.9=excellent agreement.</p>
        </sec>
      </sec>
      <sec>
        <title>Phase 2: Pilot RCT</title>
        <sec>
          <title>Participants</title>
          <p>Participants were recruited through digital media advertisements and physician referrals. Eligibility criteria included (1) being aged ≥18 years, (2) being caregivers of children aged 0-14 years, (3) having the ability to read and understand words, and (4) having internet access. Exclusion criteria included (1) having severe hearing or visual impairment; (2) having severe schizophrenia, major depression, bipolar disorder, and other mental illnesses; or (3) participation in other related studies.</p>
        </sec>
        <sec>
          <title>Sample Size</title>
          <p>Power analysis was performed using G*Power 3.1.9.7 based on similar educational intervention studies [<xref ref-type="bibr" rid="ref26">26</xref>]. A medium effect size (Cohen <italic>d</italic>=0.65) was anticipated for the primary outcome of performance. With a 2-tailed α=.05 and power of 0.8, at least 38 participants per group were required. Accounting for an expected 20% attrition rate, the target sample was 49 participants per group (total n=98). There were 127 participants in the final sample (62 in the control group and 65 in the intervention group).</p>
        </sec>
        <sec>
          <title>Randomization and Blinding</title>
          <p>Recruitment took place in the Third Affiliated Hospital of Southern Medical University and community support groups. The researchers prepared a computer-generated randomization list and sealed the allocations in opaque envelopes. Before the start of the intervention, research assistants who were not involved in hospital assessments or interventions opened the envelopes and assigned participants at random to the intervention or control group. Following informed consent, eligible participants meeting the inclusion and exclusion criteria were randomly assigned in a 1:1 ratio to either the intervention or control group. The blinding of participants was not feasible due to the nature of the intervention, but the research team remained unaware of group assignments until this study concluded. Data analysts who conducted the final analyses were masked to participant identities throughout.</p>
        </sec>
        <sec>
          <title>Control Group</title>
          <p>Participants in the control group received standard web-based educational materials prepared by clinical experts. These materials were retrieved from official sources (eg, [<xref ref-type="bibr" rid="ref27">27</xref>]). Participants were asked to read independently, simulating a typical web-based health information-seeking behavior.</p>
        </sec>
        <sec>
          <title>Intervention Group</title>
          <p>All researchers received standardized training to ensure consistent delivery of DDH-related information and LLM education. The intervention was delivered to participants by face-to-face communication. First, the participants were introduced to the foundational concepts of LLMs, including basic mechanisms, application categories, and core interaction capabilities. Second, a standardized consultation framework was introduced, covering device access, platform login, dialogue initiation, and structured prompt formulation. The required background information included demographic and clinical characteristics, symptom description, disease duration, medical history, lifestyle, and psychosocial factors. Participants were also provided with 16 DDH-related inquiry categories, including foundations, risk factors, early recognition, diagnosis, treatment, postoperative care, medication management, and psychological support. They were able to optionally specify custom output instructions, such as length, style, level of technical terminology, and formatting preferences. Third, strategies to improve information quality were introduced, including clear language prompts, staged questions, example guidance, support for the reasoning process, evidence sources for web retrieval, and document import. Verification approaches were emphasized, such as cross-model comparison, guideline checking, and professional consultation. Finally, risk awareness and ethical considerations were reinforced, including potential hallucinations, outdated content, privacy risks, copyright issues, and inappropriate clinical dependence. A practical demonstration was conducted using an actual DDH case, for example, a 1-year-old female infant with asymmetric thigh folds and a family history but no medical history. Participants inquired and learned relevant knowledge based on the background of this example. During the subsequent 2 weeks, the participants received remote support through web-based group consultations or offline feedback sessions. Researchers responded to questions related to practical application, corrected misuse behaviors, and supplemented individualized guidance.</p>
        </sec>
        <sec>
          <title>Data Collection</title>
          <p>Data were collected through questionnaire surveys. The basic information questionnaire gathered the demographic characteristics of this study’s participants. Validated scales were used to measure eHealth literacy, DDH knowledge, health risk perception, information self-efficacy, perceived usefulness, and health information-seeking behavior. There were three assessment time points: (1) baseline (T0), (2) immediately after completion of the intervention or control condition (T1), and (3) two weeks after the end of the intervention or control condition (T2).</p>
        </sec>
        <sec>
          <title>Primary Outcomes</title>
          <p>The eHealth Literacy Scale (eHEALS), originally developed by Norman and Skinner [<xref ref-type="bibr" rid="ref28">28</xref>], was adopted to measure participants’ eHealth literacy. It comprises 8 items that assess one’s ability to locate and use web-based health resources, appraise the credibility of digital health information, and apply acquired information to make informed health decisions. Each item is scored on a 5-point Likert scale, producing a total score between 8 and 40, with higher scores representing stronger eHealth literacy.</p>
        </sec>
        <sec>
          <title>Secondary Outcomes</title>
          <p>The developmental dysplasia of the hip knowledge test (DDH-KT) was developed by the research team to assess participants’ basic DDH knowledge. The items were constructed according to current clinical guidelines and health education materials and reviewed by pediatric orthopedic surgeons. Each correct answer is scored as 1 point (range 0-10), with higher scores indicating greater DDH knowledge. The full knowledge test is provided in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
          <p>Health risk perception was measured using the Health Risk Perception Scale (HRPS), which was based on the framework by Ajzen [<xref ref-type="bibr" rid="ref29">29</xref>]. The scale was adapted from established health risk perception measures by Brewer et al [<xref ref-type="bibr" rid="ref30">30</xref>] and covered 2 dimensions: perceived susceptibility and perceived severity. The items assessed participants’ subjective perception of the likelihood and potential consequences of related health problems, rated on a 5-point Likert scale. Higher scores reflected a greater level of perceived risk (Cronbach α=0.847).</p>
          <p>The Information Self-Efficacy Scale (ISES), adapted from Pavlou and Fygenson [<xref ref-type="bibr" rid="ref31">31</xref>], was used to evaluate participants’ confidence in obtaining and effectively using web-based health information. The scale contained 3 items rated on a 5-point Likert scale. Total scores were calculated by summing all item responses, with higher scores indicating stronger information self-efficacy (Cronbach α=0.806).</p>
          <p>The Perceived Usefulness Scale (PUS), adapted from Cheung et al [<xref ref-type="bibr" rid="ref32">32</xref>], assessed the extent to which participants viewed web-based health information as helpful, relevant, and beneficial for health knowledge and decision-making. Items were scored on a 5-point Likert scale, with higher scores indicating greater perceived usefulness (Cronbach α=0.852).</p>
          <p>The Health Information-Seeking Behavior Scale (HISBS), adapted from Kankanhalli et al [<xref ref-type="bibr" rid="ref33">33</xref>], measured the frequency and willingness to actively seek web-based health information. Responses were recorded using a 5-point Likert scale, and higher scores indicated more proactive seeking behavior (Cronbach α=0.873).</p>
        </sec>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>In phase 1, descriptive statistics were reported as mean (SD) and median (IQR). Because the final analytic values were obtained by averaging 3 generations, the normality assumptions for repeated-measures ANOVA were not met. Group differences among the 4 LLMs were analyzed using the Kruskal-Wallis H test, followed by Dunn-Bonferroni post hoc comparisons when significant. One-way ANOVA and Tukey post hoc tests were used for readability indices because the normality assumptions were satisfied. False discovery rate correction was applied across the 9 outcomes to control for multiple testing. Interrater reliability was assessed using ICC(2,k) based on a 2-way random-effects model [<xref ref-type="bibr" rid="ref34">34</xref>]. Effect sizes were reported as epsilon-squared for nonparametric tests and eta-squared for ANOVA. Analyses were conducted in R (version 4.5.1; R Foundation) with ggplot2 (version 3.5.1; Posit, PBC) for visualization.</p>
        <p>In phase 2, all analyses followed the intention-to-treat principle and included all randomized participants. Continuous baseline variables are presented as mean (SD), and categorical variables as counts and percentages. Differences between groups at baseline were assessed using 2-sided independent sample <italic>t</italic> tests for continuous variables and chi-square tests for categorical variables. Outcomes were analyzed using linear mixed-effects models with time (T1 and T2) and group (intervention vs control) as fixed effects, time × group interaction, baseline (T0) as a covariate, and participant ID as a random intercept. No imputation was performed because linear mixed-effects models estimated with restricted maximum likelihood provided unbiased estimates under the missing at random assumption [<xref ref-type="bibr" rid="ref35">35</xref>]. Between-group effect sizes (Cohen <italic>d</italic>, 95% CI) and estimated marginal means (95% CI) were reported. eHEALS was defined as the primary outcome. All other outcomes, including DDH-KT, HRPS, ISES, PUS, and HISBS, were considered secondary. Given the pilot and exploratory nature of this trial, no adjustment for multiple comparisons was applied. Therefore, analyses of the outcomes were intended to be hypothesis-generating rather than confirmatory. Analyses were conducted in R (version 4.5.1) using lme4, lmerTest, and emmeans; 2-sided <italic>P</italic>&#60;.05 was considered statistically significant.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was approved by the Ethics Committee of the Third Affiliated Hospital of Southern Medical University (2024-ER-113), and the first participant was enrolled in June 2025. The trial registration was completed on August 29, 2025, at the Chinese Clinical Trial Registry (ChiCTR2500108410). All research participants signed written informed consent forms. Researchers disclosed study information to participants; participants retained the right to withdraw from the study or withdraw their research data at any time without conditions, and withdrawal would not result in any adverse consequences. Participants were informed that part of the educational content was generated by AI, and the limitations of AI-generated information were explained. The use of AI-assisted materials was supervised throughout this study by qualified health care professionals. During the intervention period, participants were encouraged to report any concerns or adverse experiences related to the educational materials, and ultimately, no related adverse events were reported. All personal information and data collected during the study were kept strictly confidential. Participants who completed the entire study process received educational materials, including a parenting knowledge handbook valued at CN ¥50 (approximately US $7.15), as compensation.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Phase 1</title>
        <sec>
          <title>Overview</title>
          <p>Overall, ChatGPT-4 and DeepSeek-V3 demonstrated the strongest performance in content accuracy, richness, understandability, and information quality, making them suitable for generating pediatric health communication materials. Gemini 2.0 Flash and Copilot performed well in fluency and readability metrics, while they were relatively weaker in content richness and accuracy. <xref ref-type="table" rid="table2">Table 2</xref> provides a visual summary of the scores and the overall performance comparison. <xref rid="figure1" ref-type="fig">Figure 1</xref> illustrates the comparison of the responses across the LLMs. The scoring data are presented in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Comparison of model performance across different indicators.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="200"/>
              <col width="100"/>
              <col width="0"/>
              <col width="150"/>
              <col width="90"/>
              <col width="90"/>
              <col width="130"/>
              <col width="90"/>
              <col width="120"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Model</td>
                  <td>Mean (SD)</td>
                  <td colspan="2">Median (IQR)</td>
                  <td>H/F<sup>a</sup></td>
                  <td><italic>P</italic> value</td>
                  <td>FDR-adjusted<sup>b</sup> <italic>P</italic> value</td>
                  <td>ε²<sup>c</sup>/η²<sup>d</sup></td>
                  <td>Significance (<italic>P</italic> value)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="2">
                    <bold>Accuracy</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>13.873</td>
                  <td>.003</td>
                  <td>.005</td>
                  <td>0.73</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">64 (1.03)</td>
                  <td>63.67 (63.67-64.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>e,f</sup> (.02)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">59.07 (1.01)</td>
                  <td>59.00 (58.67-59.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>g</sup> (.048)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">63.33 (1.78)</td>
                  <td>63.67 (63.33-64.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—<sup>h</sup></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">59.53 (0.99)</td>
                  <td>59.67 (59.33-60.00)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>Richness</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>13.68</td>
                  <td>.003</td>
                  <td>.005</td>
                  <td>0.72</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">62.33 (2.26)</td>
                  <td>62.67 (60.00-64.33)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">51.6 (3.52)</td>
                  <td>52.33 (51.33-52.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>g</sup> (.02)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">63.93 (1.53)</td>
                  <td>64.00 (64.00-64.00)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">54 (5.65)</td>
                  <td>54.67 (50.33-57.33)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>Fluency</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>16.204</td>
                  <td>.001</td>
                  <td>.003</td>
                  <td>0.853</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">69.53 (1.19)</td>
                  <td>70.00 (68.67-70.00)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">64.87 (1.8)</td>
                  <td>65.67 (63.33-65.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>***<sup>i</sup> (&#60;.001)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">69.87 (2.19)</td>
                  <td>70.67 (70.33-71.00)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">73 (0.97)</td>
                  <td>72.67 (72.33-73.00)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>PEMAT-P<sup>j</sup> understandability (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>11.421</td>
                  <td>.01</td>
                  <td>.012</td>
                  <td>0.601</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">93.89 (1.24)</td>
                  <td>94.44 (94.44-94.44)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>f</sup> (.03)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">85 (4.21)</td>
                  <td>86.11 (80.56-88.89)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">93.33 (3.17)</td>
                  <td>94.44 (91.67-94.44)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">87.78 (4.21)</td>
                  <td>86.11 (86.11-88.89)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>PEMAT-P actionability (%)</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>7.587</td>
                  <td>.06</td>
                  <td>.06</td>
                  <td>0.399</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">68.33 (3.73)</td>
                  <td>66.67 (66.67-66.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">60 (6.97)</td>
                  <td>58.33 (58.33-66.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">68.33 (3.73)</td>
                  <td>66.67 (66.67-66.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">66.67 (5.89)</td>
                  <td>66.67 (66.67-66.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>DISCERN</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>10.243</td>
                  <td>.02</td>
                  <td>.02</td>
                  <td>0.539</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">48.52 (3.27)</td>
                  <td>49.00 (46.00-49.27)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>i</sup> (.035)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">46.56 (1.57)</td>
                  <td>46.67 (46.47-47.67)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">48.44 (2.71)</td>
                  <td>48.00 (46.67-49.20)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>i</sup> (.03)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">43.08 (1.82)</td>
                  <td>43.33 (42.33-43.40)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>FKGL<sup>k</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>8.395</td>
                  <td>&#60;.001</td>
                  <td>.003</td>
                  <td>0.296</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">8.74 (1.37)</td>
                  <td>8.86 (8.14-9.70)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>g</sup> (.03); *<sup>i</sup> (.04)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">9.41 (1.86)</td>
                  <td>9.07 (8.38-10.88)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>***<sup>g</sup> (&#60;.001); ***<sup>i</sup> (&#60;.001)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">7.30 (1.08)</td>
                  <td>7.26 (6.72-7.70)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">7.37 (1.33)</td>
                  <td>7.19 (6.30-8.44)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>FKRE<sup>l</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>14.198</td>
                  <td>.003</td>
                  <td>.005</td>
                  <td>0.225</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">61.86 (8.58)</td>
                  <td>61.44 (56.80-66.97)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">53.45 (12.62)</td>
                  <td>57.70 (46.25-61.33)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>**<sup>g</sup> (.006); **<sup>i</sup> (.009)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">67.19 (6.62)</td>
                  <td>67.45 (62.73-70.43)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">66.85 (7.72)</td>
                  <td>70.10 (59.19-73.48)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>SMOG<sup>m</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>8.297</td>
                  <td>&#60;.001</td>
                  <td>.003</td>
                  <td>0.293</td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td colspan="2">11.02 (1.26)</td>
                  <td>10.96 (10.52-11.61)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>*<sup>g</sup> (.02)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td colspan="2">11.67 (1.33)</td>
                  <td>11.48 (11.09-13.04)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>***<sup>g</sup> (&#60;.001); **<sup>i</sup> (.003)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td colspan="2">9.83 (0.93)</td>
                  <td>9.74 (9.25-10.19)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td colspan="2">10.19 (1.06)</td>
                  <td>10.03 (9.28-10.91)</td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>—</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>H/F: values are reported as test statistics. H statistics for the Kruskal-Wallis test and <italic>F</italic> statistics for 1-way ANOVA.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>FDR: false discovery rate.</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup>η²: eta-squared.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup>ε²: epsilon-squared.</p>
              </fn>
              <fn id="table2fn5">
                <p><sup>e</sup>*<italic>P</italic> &#60;.05. **<italic>P</italic> &#60;.01. ***<italic>P</italic> &#60;.001. Normality was assessed for all variables. FKGL and SMOG were analyzed using 1-way ANOVA with Tukey honestly significant difference for pairwise comparisons; others were analyzed using the Kruskal-Wallis test with Dunn test (Bonferroni-corrected <italic>P</italic> values).</p>
              </fn>
              <fn id="table2fn6">
                <p><sup>f</sup>vs Copilot.</p>
              </fn>
              <fn id="table2fn7">
                <p><sup>g</sup>vs DeepSeek-V3.</p>
              </fn>
              <fn id="table2fn8">
                <p><sup>h</sup>Not applicable.</p>
              </fn>
              <fn id="table2fn9">
                <p><sup>i</sup>vs Gemini 2.0 Flash.</p>
              </fn>
              <fn id="table2fn10">
                <p><sup>j</sup>PEMAT-P: Patient Education Materials Assessment Tool for Printable Materials.</p>
              </fn>
              <fn id="table2fn11">
                <p><sup>k</sup>FKGL: Flesch-Kincaid Grade Level.</p>
              </fn>
              <fn id="table2fn12">
                <p><sup>l</sup>FKRE: Flesch-Kincaid Reading Ease.</p>
              </fn>
              <fn id="table2fn13">
                <p><sup>m</sup>SMOG: Simple Measure of Gobbledygook.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Comparison of responses across 4 LLMs. (A) Accuracy, (B) richness, (C) fluency, (D) PEMAT-P understandability, (E) PEMAT-P actionability, (F) DISCERN, (G) FKGL, (H) FKRE, and (I) SMOG index. FKGL: Flesch-Kincaid Grade Level; FKRE: Flesch-Kincaid Reading Ease; LLM: large language model; PEMAT-P: Patient Education Materials Assessment Tool for Printable Materials; SMOG: Simple Measure of Gobbledygook.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e73326_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Quality Assessment</title>
          <p>There were significant differences between the 4 LLMs in terms of accuracy, richness, fluency, PEMAT-P understandability, and DISCERN (<italic>P</italic>&#60;.05). ChatGPT-4 and DeepSeek-V3 outperformed the other models in the majority of evaluation dimensions. ChatGPT-4 (median 63.67, IQR 63.67-64.67) and DeepSeek-V3 (median 63.67, IQR 63.33-64.67) generated more accurate text than Copilot (median 59.00, IQR 58.67-59.67). DeepSeek-V3 (median 64.00, IQR 64.00-64.00) was richer in language than Copilot (median 52.33, IQR 51.33-52.67). Gemini 2.0 Flash (median 72.67, IQR 72.33-73.00) was more fluent than Copilot (median 65.67, IQR 63.33-65.67). Based on the PEMAT-P understandability scores, the content of ChatGPT-4 (median 94.44%, IQR 94.44%-94.44%) was more comprehensible than that of Copilot (median 86.11%, IQR 80.56%-88.89%). The PEMAT-P actionability scores were similar across the models. ChatGPT-4 (median 49.00, IQR 46.00-49.27) and DeepSeek-V3 (median 48.00, IQR 46.67-49.20) had a higher DISCERN scale score than Gemini 2.0 Flash (median 43.33, IQR 42.33-43.40).</p>
        </sec>
        <sec>
          <title>Readability Assessment</title>
          <p>Readability metrics highlighted the differences among the models. Gemini 2.0 Flash (median 70.10, IQR 59.19-73.48) and DeepSeek-V3 (median 67.45, IQR 62.73-70.43) generated sentences with higher FKRE scores, indicating easier readability compared to Copilot (median 57.70, IQR 46.25-61.33). DeepSeek-V3 (mean 7.30, SD 1.08) and Gemini 2.0 Flash (mean 7.37, SD 1.33) produced sentences with superior FKGL scores compared to ChatGPT-4 (mean 8.74, SD 1.37) and Copilot (mean 9.41, SD 1.86). DeepSeek-V3 (mean 9.83, SD 0.93) and Gemini 2.0 Flash (mean 10.19, SD 1.06) produced texts with better SMOG scores compared to ChatGPT-4 (mean 11.02, SD 1.26) and Copilot (mean 11.67, SD 1.33).</p>
        </sec>
        <sec>
          <title>Visualization and Analysis</title>
          <p>The comparative evaluation of 4 LLMs demonstrated clear performance variability across accuracy, richness, and fluency, as illustrated in <xref rid="figure2" ref-type="fig">Figures 2</xref> and <xref rid="figure3" ref-type="fig">3</xref>. Overall, ChatGPT-4 and DeepSeek-V3 outperformed Copilot and Gemini 2.0 Flash, particularly in accuracy and fluency. In terms of accuracy, the proportion of “good” and “excellent” responses reached 85% for ChatGPT-4 and 83% for DeepSeek-V3, while Gemini 2.0 Flash (70%) and Copilot (66%) displayed a lower proportion. Regarding richness, DeepSeek-V3 (83%) and ChatGPT-4 (81%) again ranked highest, reflecting strong supplementary and explanatory capability, whereas the other 2 models were more concise. Regarding fluency, all 4 models delivered strong information elaboration, with Gemini 2.0 Flash achieving the highest proportion of 96%, indicating strong coherence, readability, and natural language expression.</p>
          <p>As shown in the heatmap (<xref rid="figure3" ref-type="fig">Figure 3</xref>), ChatGPT-4 and DeepSeek-V3 yielded higher mean scores across most knowledge domains, particularly in basic, effects, and symptoms. In contrast, Copilot and Gemini 2.0 Flash performed worse, especially in specialized domains such as medication management and postoperative care. These results suggested that current LLMs perform well in general health education content but remain limited in clinically nuanced and actionable information.</p>
          <p>Across the 4 models and 6 evaluation dimensions, the interrater reliability among the 5 evaluators ranged from moderate to excellent (ICC=0.628-0.918). <xref ref-type="table" rid="table3">Table 3</xref> shows the interrater reliability results across the 4 LLMs and evaluation dimensions based on ICC.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Expert Likert-scale ratings of content quality across 4 LLMs. LLM: large language model.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e73326_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Multidimensional performance evaluation heatmap for LLMs. Heatmap showing mean scores of 4 LLMs across accuracy, richness, fluency, and readability dimensions. Higher scores are represented by warmer colors. FRES: Flesch-Kincaid Reading Ease; LLM: large language model.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e73326_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Results of expert consistency analysis.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="320"/>
              <col width="100"/>
              <col width="150"/>
              <col width="150"/>
              <col width="100"/>
              <col width="150"/>
              <col width="0"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Dimension</td>
                  <td>ICC<sup>a,b</sup></td>
                  <td>95% CI</td>
                  <td><italic>F</italic> test (<italic>df</italic>)</td>
                  <td><italic>P</italic> value</td>
                  <td colspan="2">Interpretation</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="7">
                    <bold>Accuracy</bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td>0.851</td>
                  <td>0.695-0.941</td>
                  <td>6.734 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Good</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td>0.654</td>
                  <td>0.277-0.864</td>
                  <td>2.810 (15, 60)</td>
                  <td>.002</td>
                  <td colspan="2">Moderate</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td>0.904</td>
                  <td>0.803-0.962</td>
                  <td>11.510 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Excellent</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td>0.727</td>
                  <td>0.433-0.892</td>
                  <td>3.565 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Moderate</td>
                </tr>
                <tr valign="top">
                  <td colspan="8">
                    <bold>Richness</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td>0.669</td>
                  <td>0.352-0.864</td>
                  <td>3.499 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Moderate</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td>0.834</td>
                  <td>0.652-0.934</td>
                  <td>7.750 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Good</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td>0.747</td>
                  <td>0.481-0.899</td>
                  <td>3.944 (15, 60)</td>
                  <td>.001</td>
                  <td colspan="2">Moderate</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td>0.628</td>
                  <td>0.285-0.845</td>
                  <td>3.515 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Moderate</td>
                </tr>
                <tr valign="top">
                  <td colspan="8">
                    <bold>Fluency</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>ChatGPT-4</td>
                  <td>0.914</td>
                  <td>0.825-0.966</td>
                  <td>11.931 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Excellent</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Copilot</td>
                  <td>0.918</td>
                  <td>0.833-0.967</td>
                  <td>13.244 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Excellent</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>DeepSeek-V3</td>
                  <td>0.835</td>
                  <td>0.664-0.934</td>
                  <td>6.223 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Good</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Gemini 2.0 Flash</td>
                  <td>0.876</td>
                  <td>0.746-0.951</td>
                  <td>8.038 (15, 60)</td>
                  <td>&#60;.001</td>
                  <td colspan="2">Good</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">PEMAT-P<sup>c</sup> understandability</td>
                  <td>0.874</td>
                  <td>0.482-0.991</td>
                  <td>7.833 (3, 12)</td>
                  <td>.004</td>
                  <td colspan="2">Good</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">PEMAT-P actionability</td>
                  <td>0.718</td>
                  <td>0.050-0.980</td>
                  <td>3.858 (3, 12)</td>
                  <td>.038</td>
                  <td colspan="2">Moderate</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">DISCERN</td>
                  <td>0.819</td>
                  <td>0.358-0.986</td>
                  <td>12.473 (3, 12)</td>
                  <td>.001</td>
                  <td colspan="2">Good</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>ICC: intraclass correlation coefficient.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup>Type A intraclass correlation coefficient using an absolute agreement definition.</p>
              </fn>
              <fn id="table3fn3">
                <p><sup>c</sup>PEMAT-P: Patient Education Materials Assessment Tool for Printable Materials.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
      <sec>
        <title>Phase 2</title>
        <sec>
          <title>Participant Characteristics</title>
          <p>Participants were recruited from June 2025 to September 2025. A total of 127 participants were enrolled in this study, including 65 in the intervention group and 62 in the control group. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the CONSORT (Consolidated Standards of Reporting Trials) flowchart, and the CONSORT-EHEALTH (Consolidated Standards of Reporting Trials of Electronic and Mobile Health Applications and Online Telehealth) checklist is presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. Most participants completed the intervention, and the main reason for withdrawal was lack of time. Participants had a mean age of 36.57 (SD 6.22) years, and most were female (89/127, 70.08%) and highly educated (55/127, 43.31%). The mean age of participants’ children was 5.90 (SD 3.12) years. No significant differences were observed between the intervention and control groups in the baseline characteristics (<italic>P</italic>&#62;.05). During this study, no privacy breaches, technical failures, or other unintended events were observed. <xref ref-type="table" rid="table4">Table 4</xref> summarizes the demographic characteristics of the participants. The data of participants can be found in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>CONSORT diagram of study flow. CONSORT: Consolidated Standards of Reporting Trials.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e73326_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Baseline characteristics.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="270"/>
              <col width="0"/>
              <col width="150"/>
              <col width="0"/>
              <col width="250"/>
              <col width="0"/>
              <col width="200"/>
              <col width="0"/>
              <col width="0"/>
              <col width="100"/>
              <thead>
                <tr valign="top">
                  <td colspan="3">Background characteristic</td>
                  <td colspan="2">Overall</td>
                  <td colspan="2">Intervention group (n=65)</td>
                  <td colspan="2">Control group (n=62)</td>
                  <td colspan="2"><italic>P</italic> value</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="3">Age (years), mean (SD)</td>
                  <td colspan="2">36.57 (6.22)</td>
                  <td colspan="2">37.06 (5.68)</td>
                  <td colspan="2">36.05 (6.74)</td>
                  <td colspan="2">.14</td>
                </tr>
                <tr valign="top">
                  <td colspan="10">
                    <bold>Sex, n (%)</bold>
                  </td>
                  <td>.83</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Female</td>
                  <td colspan="2">89 (70.08)</td>
                  <td colspan="2">45 (69.23)</td>
                  <td colspan="2">44 (70.97)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Male</td>
                  <td colspan="2">38 (29.92)</td>
                  <td colspan="2">20 (30.77)</td>
                  <td colspan="2">18 (29.03)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="10">
                    <bold>Education, n (%)</bold>
                  </td>
                  <td>.92</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Low education</td>
                  <td colspan="2">18 (14.17)</td>
                  <td colspan="2">11 (16.92)</td>
                  <td colspan="2">7 (11.29)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Medium education</td>
                  <td colspan="2">54 (42.52)</td>
                  <td colspan="2">27 (41.54)</td>
                  <td colspan="2">27 (43.55)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>High education</td>
                  <td colspan="2">55 (43.31)</td>
                  <td colspan="2">27 (41.54)</td>
                  <td colspan="2">28 (45.16)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="10">
                    <bold>Monthly income (CN ¥), n (%)</bold>
                  </td>
                  <td>.85</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>≤3000 (US $429.12)</td>
                  <td colspan="2">9 (7.09)</td>
                  <td colspan="2">30 (61.2)</td>
                  <td colspan="2">35 (71.4)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>3001-6000 (US $429.26-US $858.23)</td>
                  <td colspan="2">26 (20.47)</td>
                  <td colspan="2">19 (38.8)</td>
                  <td colspan="2">14 (28.6)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>6001-10,000 (US $858.38-US $1430.39)</td>
                  <td colspan="2">42 (33.07)</td>
                  <td colspan="2">21 (33.87)</td>
                  <td colspan="2">21 (32.31)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>10,001-20,000 (US $1430.53-US $2860.78)</td>
                  <td colspan="2">36 (28.35)</td>
                  <td colspan="2">19 (30.65)</td>
                  <td colspan="2">17 (26.15)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>≥20,001 (US $2860.92)</td>
                  <td colspan="2">14 (11.02)</td>
                  <td colspan="2">7 (11.29)</td>
                  <td colspan="2">7 (10.77)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="10">
                    <bold>Child’s gender, n (%)</bold>
                  </td>
                  <td>.23</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Male</td>
                  <td colspan="2">71 (55.91)</td>
                  <td colspan="2">32 (49.23)</td>
                  <td colspan="2">24 (38.71)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Female</td>
                  <td colspan="2">56 (44.09)</td>
                  <td colspan="2">33 (50.77)</td>
                  <td colspan="2">38 (61.29)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="3">Child’s age (years), mean (SD)</td>
                  <td colspan="2">5.90 (3.12)</td>
                  <td colspan="2">6.39 (3.36)</td>
                  <td colspan="2">5.39 (2.78)</td>
                  <td colspan="2">.06</td>
                </tr>
                <tr valign="top">
                  <td colspan="10">
                    <bold>Daily caregiving time for the child (hours/day), n (%)</bold>
                  </td>
                  <td>.37</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>≤2</td>
                  <td colspan="2">17 (13.39)</td>
                  <td colspan="2">11 (16.92)</td>
                  <td colspan="2">6 (9.68)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>3-6</td>
                  <td colspan="2">55 (43.31)</td>
                  <td colspan="2">27 (41.54)</td>
                  <td colspan="2">28 (45.16)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>6-9</td>
                  <td colspan="2">16 (12.6)</td>
                  <td colspan="2">7 (10.77)</td>
                  <td colspan="2">9 (14.52)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>9-12</td>
                  <td colspan="2">15 (11.81)</td>
                  <td colspan="2">6 (9.23)</td>
                  <td colspan="2">9 (14.52)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>≥12</td>
                  <td colspan="2">24 (18.9)</td>
                  <td colspan="2">14 (21.54)</td>
                  <td colspan="2">10 (16.13)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="10">
                    <bold>Smartphone proficiency, n (%)</bold>
                  </td>
                  <td>.53</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Very proficient</td>
                  <td colspan="2">66 (51.97)</td>
                  <td colspan="2">33 (50.77)</td>
                  <td colspan="2">33 (53.23)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Basic proficient</td>
                  <td colspan="2">22 (17.33)</td>
                  <td colspan="2">14 (21.54)</td>
                  <td colspan="2">8 (12.9)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Fairly proficient</td>
                  <td colspan="2">33 (25.98)</td>
                  <td colspan="2">15 (23.08)</td>
                  <td colspan="2">18 (29.03)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Not proficient</td>
                  <td colspan="2">6 (4.72)</td>
                  <td colspan="2">3 (4.62)</td>
                  <td colspan="2">3 (4.84)</td>
                  <td colspan="3">
                    <break/>
                  </td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
        <sec>
          <title>Primary Outcome</title>
          <p>The group × time interaction in eHEALS was not significant (<italic>P</italic>=.26). The intervention group showed higher scores than the control group at T1 (33.62, 95% CI 32.76-34.49; <italic>d</italic>=0.20, 95% CI 0.13-0.56) and T2 (33.27, 95% CI 32.38-34.17; <italic>d</italic>=0.36, 95% CI 0.01-0.80), indicating sustained improvements following the LLM-generated learning intervention. <xref ref-type="table" rid="table5">Table 5</xref> reports the means estimated from the model and the contrasts between groups across the specified time points; <xref rid="figure5" ref-type="fig">Figure 5</xref> graphically illustrates the outcomes over time by condition.</p>
          <table-wrap position="float" id="table5">
            <label>Table 5</label>
            <caption>
              <p>Change in outcomes.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="120"/>
              <col width="150"/>
              <col width="150"/>
              <col width="150"/>
              <col width="100"/>
              <col width="0"/>
              <col width="150"/>
              <col width="0"/>
              <col width="150"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Time</td>
                  <td>Control EMM<sup>a</sup> (95% CI)</td>
                  <td>Intervention EMM (95% CI)</td>
                  <td colspan="3">Group difference</td>
                  <td colspan="2">Cohen <italic>d</italic> (95% CI)</td>
                  <td>Group × time interaction, <italic>P</italic> value</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>β (95% CI)</td>
                  <td>SE</td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="2">
                    <bold>eHEALS<sup>b</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">.26</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T0</td>
                  <td>29.23 (28.05 to 30.40)</td>
                  <td>27.91 (26.24 to 29.57)</td>
                  <td>—<sup>c</sup></td>
                  <td>—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1</td>
                  <td>31.89 (31.01 to 32.77)</td>
                  <td>33.62 (32.76 to 34.49)</td>
                  <td>1.73 (0.49 to 2.97)</td>
                  <td>0.63</td>
                  <td colspan="2">0.20 (0.13 to 0.56)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2</td>
                  <td>30.87 (29.97 to 31.78)</td>
                  <td>33.27 (32.38 to 34.17)</td>
                  <td>2.40 (1.13 to 3.67)</td>
                  <td>0.65</td>
                  <td colspan="2">0.36 (0.01 to 0.80)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>DDH-KT<sup>d</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">.66</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T0</td>
                  <td>4.42 (3.92 to 4.92)</td>
                  <td>4.31 (3.87 to 4.74)</td>
                  <td>—</td>
                  <td>—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1</td>
                  <td>6.65 (6.26 to 7.05)</td>
                  <td>7.87 (7.48 to 8.25)</td>
                  <td>1.22 (0.67 to 1.77)</td>
                  <td>0.28</td>
                  <td colspan="2">0.71 (0.33 to 1.11)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2</td>
                  <td>6.02 (5.62 to 6.42)</td>
                  <td>7.12 (6.72 to 7.51)</td>
                  <td>1.10 (0.53 to 1.66)</td>
                  <td>0.29</td>
                  <td colspan="2">0.54 (0.17 to 0.96)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>HRPS<sup>e</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">.25</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T0</td>
                  <td>27.60 (26.22 to 28.97)</td>
                  <td>27.20 (25.71 to 28.69)</td>
                  <td>—</td>
                  <td>—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1</td>
                  <td>29.39 (28.33 to 30.45)</td>
                  <td>32.23 (31.19 to 33.26)</td>
                  <td>2.84 (1.36 to 4.31)</td>
                  <td>0.75</td>
                  <td colspan="2">0.50 (0.12 to 0.86)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2</td>
                  <td>29.48 (28.40 to 30.56)</td>
                  <td>31.55 (30.49 to 32.61)</td>
                  <td>2.07 (0.56 to 3.59)</td>
                  <td>0.77</td>
                  <td colspan="2">0.41 (0.05 to 0.79)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>ISES<sup>f</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">.25</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T0</td>
                  <td>11.53 (10.99 to 12.08)</td>
                  <td>10.94 (10.30 to 11.58)</td>
                  <td>—</td>
                  <td>—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1</td>
                  <td>12.38 (12.00 to 12.77)</td>
                  <td>12.59 (12.22 to 12.97)</td>
                  <td>0.21 (–0.33 to 0.75)</td>
                  <td>0.27</td>
                  <td colspan="2">0.04 (–0.30 to 0.39)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2</td>
                  <td>11.96 (11.56 to 12.35)</td>
                  <td>12.51 (12.12 to 12.90)</td>
                  <td>0.55 (–0.00 to 1.11)</td>
                  <td>0.28</td>
                  <td colspan="2">0.17 (–0.19 to 0.55)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>PUS<sup>g</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">.48</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T0</td>
                  <td>15.03 (14.27 to 15.80)</td>
                  <td>14.12 (13.29 to 14.96)</td>
                  <td>—</td>
                  <td>—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1</td>
                  <td>15.93 (15.40 to 16.46)</td>
                  <td>16.70 (16.18 to 17.21)</td>
                  <td>0.77 (0.02 to 1.51)</td>
                  <td>0.38</td>
                  <td colspan="2">0.11 (–0.22 to 0.49)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2</td>
                  <td>15.61 (15.06 to 16.15)</td>
                  <td>16.66 (16.12 to 17.20)</td>
                  <td>1.05 (0.28 to 1.82)</td>
                  <td>0.39</td>
                  <td colspan="2">0.15 (–0.19 to 0.51)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>HISBS<sup>h</sup></bold>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td colspan="2">.96</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T0</td>
                  <td>14.15 (13.50 to 14.79)</td>
                  <td>13.15 (12.34 to 13.97)</td>
                  <td>—</td>
                  <td>—</td>
                  <td colspan="2">—</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1</td>
                  <td>15.68 (15.10 to 16.27)</td>
                  <td>16.15 (15.57 to 16.72)</td>
                  <td>0.46 (–0.36 to 1.28)</td>
                  <td>0.42</td>
                  <td colspan="2">0.02 (–0.32 to 0.39)</td>
                  <td colspan="2">—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2</td>
                  <td>15.23 (14.63 to 15.83)</td>
                  <td>15.67 (15.08 to 16.26)</td>
                  <td>0.44 (–0.40 to 1.28)</td>
                  <td>0.43</td>
                  <td colspan="2">0.05 (–0.33 to 0.41)</td>
                  <td colspan="2">—</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table5fn1">
                <p><sup>a</sup>EMM: estimated marginal mean.</p>
              </fn>
              <fn id="table5fn2">
                <p><sup>b</sup>eHEALS: eHealth Literacy Scale.</p>
              </fn>
              <fn id="table5fn3">
                <p><sup>c</sup>Not applicable.</p>
              </fn>
              <fn id="table5fn4">
                <p><sup>d</sup>DDH-KT: developmental dysplasia of the hip knowledge test.</p>
              </fn>
              <fn id="table5fn5">
                <p><sup>e</sup>HRPS: Health Risk Perception Scale.</p>
              </fn>
              <fn id="table5fn6">
                <p><sup>f</sup>ISES: Information Self-Efficacy Scale.</p>
              </fn>
              <fn id="table5fn7">
                <p><sup>g</sup>PUS: Perceived Usefulness Scale.</p>
              </fn>
              <fn id="table5fn8">
                <p><sup>h</sup>HISBS: Health Information-Seeking Behavior Scale.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Changes in outcomes over time by groups. (A) eHEALS (primary outcome), (B) DDH-KT, (C) HRPS, (D) ISES, (E) PUS, and (F) HISBS (secondary outcomes). DDH-KT: developmental dysplasia of the hip knowledge test; eHEALS: eHealth Literacy Scale; HISBS: Health Information-Seeking Behavior Scale; HRPS: Health Risk Perception Scale; ISES: Information Self-Efficacy Scale; PUS: Perceived Usefulness Scale.</p>
            </caption>
            <graphic xlink:href="jmir_v28i1e73326_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Secondary Outcomes</title>
          <p>All secondary outcomes showed nonsignificant group × time interactions (<italic>P</italic>&#62;.2), while the intervention group benefited from small to moderate effect sizes. DDH-KT scores were higher in the intervention group at T1 (7.87, 95% CI 7.48-8.25; <italic>d</italic>=0.71, 95% CI 0.33-1.11) and T2 (7.12, 95% CI 6.72-7.51; <italic>d</italic>=0.54, 95% CI 0.17-0.96). HRPS scores showed a similar pattern at T1 (32.23, 95% CI 31.19-33.26; <italic>d</italic>=0.50, 95% CI 0.12-0.86) and T2 (31.55, 95% CI 30.49-32.61; <italic>d</italic>=0.41, 95% CI 0.05-0.79). Additionally, PUS demonstrated consistent and statistically meaningful between-group differences favoring the intervention group at both T1 (16.70, 95% CI 16.18-17.21; <italic>d</italic>=0.11, 95% CI –0.22 to 0.49) and T2 (16.66, 95% CI 16.12-17.20; <italic>d</italic>=0.15, 95% CI –0.19 to 0.51). ISES and HISBS scores showed comparable positive trends; however, there was little difference between the groups.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study evaluated the performance of 4 mainstream LLMs in generating health education content and validated the effectiveness of LLM-generated caregiver education interventions. All 4 models demonstrated robust capabilities in generating content. ChatGPT-4 and DeepSeek-V3 outperformed Copilot and Gemini Flash in accuracy and fluency. The pilot trial suggests that LLM-assisted education may be associated with modest improvements in eHealth literacy (the primary outcome) and DDH knowledge compared with web-based searches; however, these findings should be interpreted as exploratory rather than confirmatory. These findings suggested that LLM-generated content was a feasible supplementary approach for health education. Its effectiveness appears to be enhanced when structured instruction and guided use are provided.</p>
      </sec>
      <sec>
        <title>LLMs Performance</title>
        <p>Overall, ChatGPT-4 performed well across several dimensions. It excelled in producing content that was logically clear and linguistically fluent. ChatGPT-4 was widely suitable for tasks with moderate complexity. DeepSeek-V3 was ideal for generating complex health education content, especially content requiring depth and professionalism. Gemini 2.0 Flash excelled in fluency and readability but had minor deficits in richness and accuracy. Its concise content is suitable for quick-reference scenarios. Gemini 2.0 Flash was useful for quickly accessing information. However, it was limited in tasks requiring depth. Its design focuses on simplicity and efficiency, suitable for everyday consultations, simple question answering, and other low-complexity tasks. Copilot performed weakly in several dimensions, with omissions in its generated content and slightly obscure language expressions. It was suitable for tasks with lower content-quality requirements.</p>
        <p>All 4 LLMs scored at or above the neutral threshold (≥3/5) for accuracy, richness, and fluency. PEMAT-P understandability ≥70% indicated that basic comprehension standards were met. However, their PEMAT-P actionability was limited. This limitation may reduce the utility of LLM-generated handouts for guiding caregiver decisions. Only Copilot provides source citations, which raises concerns about the traceability and reliability of the information. Although readability levels were close to the average reading level of US adults (eighth grade) [<xref ref-type="bibr" rid="ref36">36</xref>], they still exceeded American Medical Association recommendations (no more than sixth grade) for health education materials [<xref ref-type="bibr" rid="ref37">37</xref>]. Nevertheless, the current web-based health education materials for orthopedic specialties were less than this recommendation [<xref ref-type="bibr" rid="ref38">38</xref>]. This gap suggests that the readability of content generated by LLMs within the prompt framework has improved, but needs to be further optimized for the health education materials [<xref ref-type="bibr" rid="ref39">39</xref>].</p>
        <p>Based on publicly available official documentation and technical reports, the observed performance differences among the evaluated LLMs may be attributed to variations in training data, architectural design, and optimization objectives. ChatGPT-4 is described as a transformer-based multimodal model trained on a mixture of public and licensed data and aligned through supervised fine-tuning and reinforcement learning from human feedback. DeepSeek-V3 uses a mixture-of-experts architecture and large-scale pretraining, which may favor long-form generation and information coverage, helping explain its more comprehensive outputs. Gemini 2.0 Flash emphasizes efficiency and interaction speed, suggesting an optimization trade-off that supports fluency and readability but may constrain depth under limited prompting. Copilot functions as a product-level system rather than a fixed foundation model, with outputs influenced by orchestration layers and underlying model routing that can vary over time. Overall, these findings indicate that suitability for caregiver-oriented health education depends on how training data, architecture, and optimization priorities align with specific educational goals, rather than on overall model capability alone.</p>
      </sec>
      <sec>
        <title>Evaluation Indicators</title>
        <p>In practice, AI-assisted learning was associated with modest improvements in caregivers’ eHealth literacy and DDH knowledge compared with unguided web-based searches. This supported the educational value of using LLM-generated content. Short-term exposure did not significantly increase self-efficacy or active information-seeking behavior. This observation was consistent with behavioral science evidence. It emphasized that knowledge improvement was insufficient to drive behavioral change without supportive motivation, confidence, and environmental reinforcement. Lasting behavioral changes may require longer reinforcement, repeated exposure, environmental support, or clinician guidance. Although content generated by advanced models was more accurate and detailed, caregivers generally preferred concise, readable materials over lengthy or overly technical texts. This indicated that optimal education required balancing accuracy, conciseness, and clarity, rather than solely pursuing information richness.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Prior studies had mostly evaluated a single LLM using a limited set of metrics. For instance, ChatGPT-3.5’s responses to spinal surgery questions were assessed solely for accuracy and readability [<xref ref-type="bibr" rid="ref40">40</xref>]. This study extended previous research by systematically comparing 4 mainstream LLMs under identical conditions. We included expert ratings (accuracy, richness, and fluency), standardized assessment instruments (Patient Education Materials Assessment Tool and DISCERN), readability metrics, and learning outcomes. By connecting content quality to user learning outcomes, our study provided a more comprehensive and clinically relevant assessment of LLMs for health education. Building on prior teaching improvements achieved with Bloom’s taxonomy [<xref ref-type="bibr" rid="ref41">41</xref>], we used this taxonomy to improve the education by applying an organized method to the content created by the LLMs. Prior studies showed that LLMs such as ChatGPT can enhance information accessibility, support communication and decision-making, and reduce anxiety levels [<xref ref-type="bibr" rid="ref42">42</xref>]. These benefits have been demonstrated across diverse clinical contexts, including cancer care, orthopedic surgery, and mental health interventions [<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref45">45</xref>]. One study reported that chatbot-enhanced prenatal education improved knowledge more effectively than standard mobile applications [<xref ref-type="bibr" rid="ref46">46</xref>]. Our results supported these findings by showing significant improvements in caregivers’ eHealth literacy and knowledge of DDH. We focused more on enhancing eHealth literacy than on specific disease knowledge. This competency was essential not only for acquiring medical knowledge but also for enabling users to properly browse and use AI solutions across varied health information demands. Given that AI systems offer more flexible, interactive, and context-adaptive support than internet search, higher levels of eHealth literacy are necessary to ensure their safe and optimal use.</p>
        <p>LLMs were characterized by real-time dialogue, instant feedback, and personalized communication. These features enhanced user engagement during health education processes, thereby improving knowledge acquisition [<xref ref-type="bibr" rid="ref44">44</xref>]. Participants in the intervention group demonstrated significantly higher health-risk perception than those in the web-based group, showing that personalized AI-generated information increases perceived relevance and strengthens risk understanding. Additionally, the immediate responses and conversational interactivity of LLMs maintained user attention more effectively than static web-based information [<xref ref-type="bibr" rid="ref47">47</xref>]. This resulted in increased satisfaction and maintained engagement.</p>
        <p>Despite these advantages, some studies identified notable limitations in the accuracy and completeness of LLM outputs. McMahon and McMahon [<xref ref-type="bibr" rid="ref48">48</xref>] warned that ChatGPT may generate misleading or unsafe recommendations in sensitive scenarios such as medication abortion. Ponzo et al [<xref ref-type="bibr" rid="ref49">49</xref>] demonstrated that ChatGPT often produced incomplete or inconsistent dietary advice requiring professional revision. This pattern aligned with our heat-map analysis: LLMs performed best on descriptive topics but worst on topics requiring clinical reasoning, procedural detail, or the latest guideline recommendations, such as medication management, postoperative instructions, and emergency decision-making. These weaknesses appeared across multiple medical specialties and reflected broader constraints [<xref ref-type="bibr" rid="ref50">50</xref>], including incomplete clinical training data, difficulty generating actionable guidance, and the inherently cautious tendency of general-purpose LLMs. Thus, caregivers using AI-assisted information retrieval still require oversight and guidance from health care professionals [<xref ref-type="bibr" rid="ref51">51</xref>].</p>
      </sec>
      <sec>
        <title>Study Limitations</title>
        <p>This study has several limitations. First, although expert evaluation is an essential component of content quality assessment, it may carry the risk of subjective bias. Second, the evaluation was based on responses to a limited set of common DDH-related prompts. The variety and complexity of actual caregiver inquiries might not be adequately captured by such a limited selection of prompts. Third, responses to each question were generated only 3 times because of limitations on model use and study feasibility. Estimates of model variability would be more stable with more repetitions. Fourth, each LLM’s web-based interface characteristics were standardized, which may cause slight differences compared with the typical interaction conditions of actual users. Finally, because LLMs undergo frequent updates and iterative changes, the findings of this study reflect model performance during the specific access period and may not fully generalize to future versions.</p>
      </sec>
      <sec>
        <title>Practical Implications and Future Recommendations</title>
        <p>The 2-stage results suggest that LLMs have potential as accessible, cost-effective, and personalized educational tools for caregivers, particularly in settings where traditional health education resources are limited. AI may supplement traditional clinician education by automating repetitive informational tasks, thereby alleviating health care professionals’ workload and allowing them to prioritize complex clinical cases. Enhancing knowledge and timely medical consultation are especially important for the early recognition of DDH. In rural and remote places with inadequate medical services, LLMs may help minimize geographic and economic obstacles to health education, increasing educational reach [<xref ref-type="bibr" rid="ref52">52</xref>].</p>
        <p>The perceived utility of AI-generated content is not solely determined by technical accuracy. Although ChatGPT-4 and DeepSeek-V3 generated high-quality content, users do not always prefer longer or more detailed responses. Caregivers, especially older adults, often prefer concise and clear information [<xref ref-type="bibr" rid="ref53">53</xref>]. This suggests that instructional design should balance content quality with readability. Accordingly, when incorporating LLMs into clinical education, health educators may consider structured prompting and staged content generation. Instructional design might begin with simple explanations and, as users express interest, gradually provide more specialized information with a guided summary.</p>
        <p>However, the risks of misinformation, hallucinations, and unclear accountability cannot be ignored. LLM outputs exhibit inherent uncertainty; responses can vary across conversational contexts and may contain plausible but inaccurate statements regarding diagnostic thresholds or guideline-specific recommendations [<xref ref-type="bibr" rid="ref54">54</xref>]. Furthermore, potential biases in training data may limit the cultural and contextual adaptability of these models [<xref ref-type="bibr" rid="ref55">55</xref>], as they may inadvertently reflect high-resource health care assumptions while overlooking local beliefs, language nuances, or service availability. Therefore, to ensure safe use, LLMs should be positioned strictly as auxiliary tools rather than substitutes for comprehensive medical assessments, physical examinations, and consultations with health care professionals [<xref ref-type="bibr" rid="ref56">56</xref>]. In clinical practice, data confidentiality must be treated as a primary prerequisite. Patients should provide informed consent for the use of LLM-assisted education, and workflows should explicitly discourage the entry or disclosure of identifiable personal information [<xref ref-type="bibr" rid="ref57">57</xref>]. Professional monitoring is crucial because LLM-generated content can be ambiguous, erroneous, or biased. This includes regular evaluation of AI-generated educational outputs, bias-aware checks, and escalation procedures when high-risk issues emerge [<xref ref-type="bibr" rid="ref58">58</xref>]. Future implementation strategies include retrieval-augmented generation, expert review mechanisms, and standardized safety and regulatory frameworks. With these safeguards, systematic incorporation of LLMs into health care procedures may support standardized health education and improve efficiency and scalability without compromising safety [<xref ref-type="bibr" rid="ref59">59</xref>]. Future work should also identify the support resources required for safe adoption, including staff training, governance and auditing procedures, and technical infrastructure. With such support in place, LLMs hold potential to support future health education and clinical communication.</p>
      </sec>
      <sec>
        <title>Implications for Practice</title>
        <p>For practice, we recommend (1) preferring models that cite reliable sources, (2) using prompts that request guideline-based advice, (3) always including disclaimers clarifying that LLMs cannot replace professional consultation, (4) targeting ≤6th-grade readability and simplifying outputs with follow-up prompts, and (5) reviewing and adapting content before sharing it with patients.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study demonstrates that LLMs hold substantial potential for supporting education in DDH. ChatGPT-4 achieved 85% accuracy and 93% fluency, while DeepSeek-V3 led in richness (83%), generally outperforming Copilot and Gemini 2.0 Flash. AI-assisted education was associated with small to moderate effect sizes for caregivers’ eHealth literacy, DDH knowledge, health risk perception, and perceived usefulness compared with web-based searches in this pilot trial. In addition, this study applied Bloom’s Taxonomy as a guiding pedagogical framework to structure the LLM-generated DDH educational content. This approach allowed the content to support the spectrum of caregiver learning needs, extending from foundational knowledge acquisition to decision-oriented guidance. Study limitations include potential expert subjectivity, a narrow prompt set with few generations, and controlled interface settings. LLMs are auxiliary tools and cannot replace health care professionals. Future research should focus on optimizing plain language, refining dialogue design, and enhancing audience personalization to improve the quality of materials generated by LLMs.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Question bank and generated data.</p>
        <media xlink:href="jmir_v28i1e73326_app1.docx" xlink:title="DOCX File , 303 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Formulas for evaluating readability.</p>
        <media xlink:href="jmir_v28i1e73326_app2.docx" xlink:title="DOCX File , 38 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>DDH knowledge test. DDH: developmental dysplasia of the hip.</p>
        <media xlink:href="jmir_v28i1e73326_app3.docx" xlink:title="DOCX File , 17 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Phase 1 scoring data.</p>
        <media xlink:href="jmir_v28i1e73326_app4.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 55 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>CONSORT-EHEALTH checklist (V 1.6.1).</p>
        <media xlink:href="jmir_v28i1e73326_app5.pdf" xlink:title="PDF File  (Adobe PDF File), 2774 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Phase 2 participants' scoring data.</p>
        <media xlink:href="jmir_v28i1e73326_app6.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 31 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CONSORT</term>
          <def>
            <p>Consolidated Standards of Reporting Trials</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CONSORT-EHEALTH</term>
          <def>
            <p>Consolidated Standards of Reporting Trials of Electronic and Mobile Health Applications and Online Telehealth</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">DDH</term>
          <def>
            <p>developmental dysplasia of the hip</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">DDH-KT</term>
          <def>
            <p>developmental dysplasia of the hip knowledge test</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">eHEALS</term>
          <def>
            <p>eHealth Literacy Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">FKGL</term>
          <def>
            <p>Flesch-Kincaid Grade Level</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">FKRE</term>
          <def>
            <p>Flesch-Kincaid Reading Ease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">HISBS</term>
          <def>
            <p>Health Information-Seeking Behavior Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">HRPS</term>
          <def>
            <p>Health Risk Perception Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">ICC</term>
          <def>
            <p>intraclass correlation coefficient</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">ISES</term>
          <def>
            <p>Information Self-Efficacy Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">PEMAT-P</term>
          <def>
            <p>Patient Education Materials Assessment Tool for Printable Materials</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">PUS</term>
          <def>
            <p>Perceived Usefulness Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">RCT</term>
          <def>
            <p>randomized controlled trial</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">SMOG</term>
          <def>
            <p>Simple Measure of Gobbledygook</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <notes>
      <sec>
        <title>Funding</title>
        <p>This work was supported by the Guangdong Provincial Education Science Planning Project (Higher Education Research Special Topic) for 2025 (2025GXJK0331); the Science and Technology Program of Guangzhou Sports Bureau for 2025 (ST20250986); the Nursing Research Special Program of Southern Medical University for 2025 (Y2025008); the Education and Teaching Research Project of The Third Affiliated Hospital, Southern Medical University, for 2025 (JXY202517); and the President Foundation of The Third Affiliated Hospital, Southern Medical University, for 2022 (YH202207).</p>
      </sec>
    </notes>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The full data supporting this study, including scoring data from phase 1 and outcomes from phase 2, can be accessed from the Multimedia Appendices.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>Conceptualization: YL</p>
        <p>Data curation: HO, ZY, YL</p>
        <p>Formal analysis: GL, JY</p>
        <p>Funding acquisition: YC</p>
        <p>Methodology: YL</p>
        <p>Supervision: FQ, JY</p>
        <p>Validation: GL, HY</p>
        <p>Visualization: YL</p>
        <p>Writing – original draft: HO</p>
        <p>Writing – review &#38; editing: FQ, YC</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pei</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of developmental dysplasia of the hip (DDH) in infants: a systematic review and meta-analysis</article-title>
          <source>BMJ Paediatr Open</source>
          <year>2023</year>
          <month>10</month>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e002080</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37879719"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjpo-2023-002080</pub-id>
          <pub-id pub-id-type="medline">37879719</pub-id>
          <pub-id pub-id-type="pii">10.1136/bmjpo-2023-002080</pub-id>
          <pub-id pub-id-type="pmcid">PMC10603435</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>American Academy of Pediatrics</collab>
          </person-group>
          <article-title>Long-term outcome of delayed diagnosis of developmental hip dysplasia</article-title>
          <source>AAP Grand Rounds</source>
          <year>2020</year>
          <month>11</month>
          <volume>44</volume>
          <fpage>53</fpage>
          <lpage>53</lpage>
          <pub-id pub-id-type="doi">10.1542/gr.44-5-53</pub-id>
          <pub-id pub-id-type="medline">26033050</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kolb</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chiari</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schreiner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Heisinger</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Willegger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rettl</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Windhager</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Development of an electronic navigation system for elimination of examiner-dependent factors in the ultrasound screening for developmental dysplasia of the hip in newborns</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>10</month>
          <day>02</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>16407</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-73536-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-73536-9</pub-id>
          <pub-id pub-id-type="medline">33009470</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-73536-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7532432</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bakarman</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Alsiddiky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zamzam</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alzain</surname>
              <given-names>KO</given-names>
            </name>
            <name name-style="western">
              <surname>Alhuzaimi</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Rafiq</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Developmental dysplasia of the hip (DDH): etiology, diagnosis, and management</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>e43207</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37692580"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.43207</pub-id>
          <pub-id pub-id-type="medline">37692580</pub-id>
          <pub-id pub-id-type="pmcid">PMC10488138</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pagano</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Holzapfel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kappenschneider</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Maderbacher</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Grifka</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Holzapfel</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>Arthrosis diagnosis and treatment recommendations in clinical practice: an exploratory investigation with the generative AI model GPT-4</article-title>
          <source>J Orthop Traumatol</source>
          <year>2023</year>
          <month>11</month>
          <day>28</day>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38015298"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s10195-023-00740-4</pub-id>
          <pub-id pub-id-type="medline">38015298</pub-id>
          <pub-id pub-id-type="pii">10.1186/s10195-023-00740-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC10684473</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yun</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>EK</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive evaluation of ChatGPT consultation quality for augmentation mammoplasty: A comparative analysis between plastic surgeons and laypersons</article-title>
          <source>Int J Med Inform</source>
          <year>2023</year>
          <month>11</month>
          <volume>179</volume>
          <fpage>105219</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1386-5056(23)00237-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105219</pub-id>
          <pub-id pub-id-type="medline">37776670</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(23)00237-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>YV</given-names>
            </name>
            <name name-style="western">
              <surname>Govil</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Majid</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shue</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Schehlein</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Christopher</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Groth</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>SY</given-names>
            </name>
          </person-group>
          <article-title>Comparison of ophthalmologist and large language model chatbot responses to online patient eye care questions</article-title>
          <source>JAMA Netw Open</source>
          <year>2023</year>
          <month>08</month>
          <day>01</day>
          <volume>6</volume>
          <issue>8</issue>
          <fpage>e2330320</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37606922"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.30320</pub-id>
          <pub-id pub-id-type="medline">37606922</pub-id>
          <pub-id pub-id-type="pii">2808557</pub-id>
          <pub-id pub-id-type="pmcid">PMC10445188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dağci</surname>
              <given-names>Mahmut</given-names>
            </name>
            <name name-style="western">
              <surname>Çam</surname>
              <given-names>Funda</given-names>
            </name>
            <name name-style="western">
              <surname>Dost</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Reliability and quality of the nursing care planning texts generated by ChatGPT</article-title>
          <source>Nurse Educ</source>
          <year>2024</year>
          <volume>49</volume>
          <issue>3</issue>
          <fpage>E109</fpage>
          <lpage>E114</lpage>
          <pub-id pub-id-type="doi">10.1097/NNE.0000000000001566</pub-id>
          <pub-id pub-id-type="medline">37994523</pub-id>
          <pub-id pub-id-type="pii">00006223-202405000-00011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Perez-Heydrich</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>DX</given-names>
            </name>
            <name name-style="western">
              <surname>Nellis</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT vs. web search for patient questions: what does ChatGPT do better?</article-title>
          <source>Eur Arch Otorhinolaryngol</source>
          <year>2024</year>
          <month>06</month>
          <volume>281</volume>
          <issue>6</issue>
          <fpage>3219</fpage>
          <lpage>3225</lpage>
          <pub-id pub-id-type="doi">10.1007/s00405-024-08524-0</pub-id>
          <pub-id pub-id-type="medline">38416195</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00405-024-08524-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC11410109</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Logan</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Kichenadasse</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sorich</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence chatbots will revolutionize how cancer patients access information: ChatGPT represents a paradigm-shift</article-title>
          <source>JNCI Cancer Spectr</source>
          <year>2023</year>
          <month>03</month>
          <day>01</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>pkad010</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36808255"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jncics/pkad010</pub-id>
          <pub-id pub-id-type="medline">36808255</pub-id>
          <pub-id pub-id-type="pii">7049531</pub-id>
          <pub-id pub-id-type="pmcid">PMC10013638</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Amaral</surname>
              <given-names>JZ</given-names>
            </name>
            <name name-style="western">
              <surname>Schultz</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Touban</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>McGraw-Heinrich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McKay</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenfeld</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>BG</given-names>
            </name>
          </person-group>
          <article-title>Evaluating chat generative pre-trained transformer responses to common pediatric in-toeing questions</article-title>
          <source>J Pediatr Orthop</source>
          <year>2024</year>
          <month>08</month>
          <day>01</day>
          <volume>44</volume>
          <issue>7</issue>
          <fpage>e592</fpage>
          <lpage>e597</lpage>
          <pub-id pub-id-type="doi">10.1097/BPO.0000000000002695</pub-id>
          <pub-id pub-id-type="medline">38686934</pub-id>
          <pub-id pub-id-type="pii">01241398-990000000-00553</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alber</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Alyakin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Valliani</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenbaum</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Amend-Thomas</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Kurland</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Kremer</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Eremiev</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Negash</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wiggan</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Nakatsuka</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Sangwon</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Neifert</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Save</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Palla</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Grin</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Hedman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nasir-Moin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>XC</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>LY</given-names>
            </name>
            <name name-style="western">
              <surname>Mankowski</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Segev</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Aphinyanaphongs</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Riina</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Golfinos</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Orringer</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Kondziolka</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oermann</surname>
              <given-names>EK</given-names>
            </name>
          </person-group>
          <article-title>Medical large language models are vulnerable to data-poisoning attacks</article-title>
          <source>Nat Med</source>
          <year>2025</year>
          <month>02</month>
          <volume>31</volume>
          <issue>2</issue>
          <fpage>618</fpage>
          <lpage>626</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-024-03445-1</pub-id>
          <pub-id pub-id-type="medline">39779928</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-024-03445-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC11835729</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>On hallucination and predictive uncertainty in conditional language generation</article-title>
          <source>Association for Computational Linguistics</source>
          <year>2021</year>
          <month>04</month>
          <conf-name>Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume</conf-name>
          <conf-date>2021</conf-date>
          <conf-loc>Online</conf-loc>
          <fpage>2734</fpage>
          <lpage>2744</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2021.eacl-main.236</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aydin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karabacak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vlachos</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Margetis</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Large language models in patient education: a scoping review of applications in medicine</article-title>
          <source>Front Med (Lausanne)</source>
          <year>2024</year>
          <month>10</month>
          <volume>11</volume>
          <fpage>1477898</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fmed.2024.1477898"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fmed.2024.1477898</pub-id>
          <pub-id pub-id-type="medline">39534227</pub-id>
          <pub-id pub-id-type="pmcid">PMC11554522</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Poliak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Faix</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Longhurst</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Hogarth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Comparing physician and artificial intelligence chatbot responses to patient questions posted to a public social media forum</article-title>
          <source>JAMA Intern Med</source>
          <year>2023</year>
          <month>06</month>
          <day>01</day>
          <volume>183</volume>
          <issue>6</issue>
          <fpage>589</fpage>
          <lpage>596</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37115527"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2023.1838</pub-id>
          <pub-id pub-id-type="medline">37115527</pub-id>
          <pub-id pub-id-type="pii">2804309</pub-id>
          <pub-id pub-id-type="pmcid">PMC10148230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boland</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Graham</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Légaré</surname>
              <given-names>France</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jull</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shephard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lawson</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yameogo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stacey</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Barriers and facilitators of pediatric shared decision-making: a systematic review</article-title>
          <source>Implement Sci</source>
          <year>2019</year>
          <month>01</month>
          <day>18</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>7</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://implementationscience.biomedcentral.com/articles/10.1186/s13012-018-0851-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13012-018-0851-5</pub-id>
          <pub-id pub-id-type="medline">30658670</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13012-018-0851-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC6339273</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bloom</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Engelhart</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Furst</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>WH</given-names>
            </name>
          </person-group>
          <source>Taxonomy of Educational Objectives</source>
          <year>1964</year>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>Longmans, Green</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al-Haj Ali</surname>
              <given-names>Sanaa N</given-names>
            </name>
          </person-group>
          <article-title>Emergency management of permanent tooth avulsion: comparative performance of dental students and artificial intelligence using a multimodal clinical vignette across Bloom's taxonomy domains</article-title>
          <source>Int Endod J</source>
          <year>2025</year>
          <month>11</month>
          <day>11</day>
          <comment>(forthcoming)</comment>
          <pub-id pub-id-type="doi">10.1111/iej.70060</pub-id>
          <pub-id pub-id-type="medline">41216987</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>American Institute of Ultrasound in Medicine</collab>
          </person-group>
          <article-title>AIUM practice guideline for the performance of an ultrasound examination for detection and assessment of developmental dysplasia of the hip</article-title>
          <source>J Ultrasound Med</source>
          <year>2013</year>
          <month>07</month>
          <volume>32</volume>
          <issue>7</issue>
          <fpage>1307</fpage>
          <lpage>1317</lpage>
          <pub-id pub-id-type="doi">10.7863/ultra.32.7.1307</pub-id>
          <pub-id pub-id-type="medline">23804356</pub-id>
          <pub-id pub-id-type="pii">32/7/1307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <article-title>AIUM-ACR-SPR-SRU practice parameter for the performance of an ultrasound examination for detection and assessment of developmental dysplasia of the hip</article-title>
          <source>J Ultrasound Med</source>
          <year>2018</year>
          <volume>37</volume>
          <issue>11</issue>
          <fpage>E1</fpage>
          <lpage>E5</lpage>
          <pub-id pub-id-type="doi">10.1002/jum.14829</pub-id>
          <pub-id pub-id-type="medline">30308084</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Committee on Quality Improvement</collab>
            <collab>Subcommittee on Developmental Dysplasia of the Hip</collab>
            <collab>American Academy of Pediatrics</collab>
          </person-group>
          <article-title>Clinical practice guideline: early detection of developmental dysplasia of the hip</article-title>
          <source>Pediatrics</source>
          <year>2000</year>
          <month>04</month>
          <volume>105</volume>
          <issue>4 Pt 1</issue>
          <fpage>896</fpage>
          <lpage>905</lpage>
          <pub-id pub-id-type="doi">10.1542/peds.105.4.896</pub-id>
          <pub-id pub-id-type="medline">10742345</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Dorfman</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Rigsby</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Iyer</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Alazraki</surname>
              <given-names>Adina L</given-names>
            </name>
            <name name-style="western">
              <surname>Anupindi</surname>
              <given-names>Sudha A</given-names>
            </name>
            <name name-style="western">
              <surname>Bardo</surname>
              <given-names>Dianna M E</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>Brandon P</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>Sherwin S</given-names>
            </name>
            <name name-style="western">
              <surname>Chandra</surname>
              <given-names>Tushar</given-names>
            </name>
            <name name-style="western">
              <surname>Garber</surname>
              <given-names>Matthew D</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>Michael M</given-names>
            </name>
            <name name-style="western">
              <surname>Pandya</surname>
              <given-names>Nirav K</given-names>
            </name>
            <name name-style="western">
              <surname>Shet</surname>
              <given-names>Narendra S</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>Alan</given-names>
            </name>
            <name name-style="western">
              <surname>Karmazyn</surname>
              <given-names>Boaz</given-names>
            </name>
          </person-group>
          <article-title>ACR Appropriateness Criteria developmental dysplasia of the hip-child</article-title>
          <source>J Am Coll Radiol</source>
          <year>2019</year>
          <month>05</month>
          <volume>16</volume>
          <issue>5S</issue>
          <fpage>S94</fpage>
          <lpage>S103</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jacr.2019.02.014</pub-id>
          <pub-id pub-id-type="medline">31054762</pub-id>
          <pub-id pub-id-type="pii">S1546-1440(19)30154-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mulpuri</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Tebor</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Otsuka</surname>
              <given-names>NY</given-names>
            </name>
            <name name-style="western">
              <surname>Lubicky</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Szalay</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Harcke</surname>
              <given-names>HT</given-names>
            </name>
            <name name-style="western">
              <surname>Zehr</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Spooner</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Campos-Outcalt</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Henningsen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jevsevar</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brox</surname>
              <given-names>WT</given-names>
            </name>
            <name name-style="western">
              <surname>Shea</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bozic</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shaffer</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Cummins</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Mohiuddin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shores</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Woznica</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sevarino</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The American Academy of Orthopaedic Surgeons evidence-based guideline on detection and nonoperative management of pediatric developmental dysplasia of the hip in infants up to six months of age</article-title>
          <source>J Bone Joint Surg Am</source>
          <year>2015</year>
          <month>10</month>
          <day>21</day>
          <volume>97</volume>
          <issue>20</issue>
          <fpage>1717</fpage>
          <lpage>1718</lpage>
          <pub-id pub-id-type="doi">10.2106/JBJS.O.00500</pub-id>
          <pub-id pub-id-type="medline">26491137</pub-id>
          <pub-id pub-id-type="pii">97/20/1717</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Charnock</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shepperd</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Needham</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gann</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>DISCERN: an instrument for judging the quality of written consumer health information on treatment choices</article-title>
          <source>J Epidemiol Community Health</source>
          <year>1999</year>
          <month>02</month>
          <volume>53</volume>
          <issue>2</issue>
          <fpage>105</fpage>
          <lpage>111</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jech.bmj.com/lookup/pmidlookup?view=long&#38;pmid=10396471"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jech.53.2.105</pub-id>
          <pub-id pub-id-type="medline">10396471</pub-id>
          <pub-id pub-id-type="pmcid">PMC1756830</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shoemaker</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Brach</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Development of the Patient Education Materials Assessment Tool (PEMAT): a new measure of understandability and actionability for print and audiovisual patient information</article-title>
          <source>Patient Educ Couns</source>
          <year>2014</year>
          <month>09</month>
          <volume>96</volume>
          <issue>3</issue>
          <fpage>395</fpage>
          <lpage>403</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24973195"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2014.05.027</pub-id>
          <pub-id pub-id-type="medline">24973195</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(14)00233-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC5085258</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kestel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Çalık</surname>
              <given-names>Afra</given-names>
            </name>
            <name name-style="western">
              <surname>Kuş</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The effect of chatbot-supported instruction on nursing students' history-taking questioning skills and stress level: a randomized controlled study</article-title>
          <source>J Prof Nurs</source>
          <year>2025</year>
          <volume>60</volume>
          <fpage>93</fpage>
          <lpage>100</lpage>
          <pub-id pub-id-type="doi">10.1016/j.profnurs.2025.07.004</pub-id>
          <pub-id pub-id-type="medline">40915772</pub-id>
          <pub-id pub-id-type="pii">S8755-7223(25)00108-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <article-title>Hip dysplasia</article-title>
          <source>Wikipedia</source>
          <access-date>2026-01-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://en.wikipedia.org/wiki/Hip_dysplasia">https://en.wikipedia.org/wiki/Hip_dysplasia</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Norman</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Skinner</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>eHEALS: The eHealth Literacy Scale</article-title>
          <source>J Med Internet Res</source>
          <year>2006</year>
          <month>11</month>
          <day>14</day>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>e27</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2006/4/e27/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.8.4.e27</pub-id>
          <pub-id pub-id-type="medline">17213046</pub-id>
          <pub-id pub-id-type="pii">v8i4e27</pub-id>
          <pub-id pub-id-type="pmcid">PMC1794004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ajzen</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <source>Understanding Attitudes and Predicting Social Behavior</source>
          <year>1980</year>
          <publisher-loc>Englewood Cliffs, NJ</publisher-loc>
          <publisher-name>Prentice-Hall</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brewer</surname>
              <given-names>NT</given-names>
            </name>
            <name name-style="western">
              <surname>Weinstein</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Cuite</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Herrington</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>Risk perceptions and their relation to risk behavior</article-title>
          <source>Ann Behav Med</source>
          <year>2004</year>
          <month>04</month>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>125</fpage>
          <lpage>130</lpage>
          <pub-id pub-id-type="doi">10.1207/s15324796abm2702_7</pub-id>
          <pub-id pub-id-type="medline">15026296</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
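            <name name-style="western">
              <surname>Pavlou</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Fygenson</surname>
              <given-names>M</given-names>
            </name>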
          </person-group>
          <article-title>Understanding and predicting electronic commerce adoption: an extension of the theory of planned behavior</article-title>
          <source>MIS Q</source>
          <year>2006</year>
          <volume>30</volume>
          <issue>1</issue>
          <fpage>115</fpage>
          <lpage>143</lpage>
          <pub-id pub-id-type="doi">10.2307/25148720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Rabjohn</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>The impact of electronic word-of-mouth: the adoption of online opinions in online customer communities</article-title>
          <source>Internet Res</source>
          <year>2008</year>
          <volume>18</volume>
          <issue>3</issue>
          <fpage>229</fpage>
          <lpage>247</lpage>
          <pub-id pub-id-type="doi">10.1108/10662240810883290</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
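            <name name-style="western">
              <surname>Kankanhalli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>BCY</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>KK</given-names>
            </name>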
          </person-group>
          <article-title>Contributing knowledge to electronic knowledge repositories: an empirical investigation</article-title>
          <source>MIS Q</source>
          <year>2005</year>
          <volume>29</volume>
          <issue>1</issue>
          <fpage>113</fpage>
          <lpage>144</lpage>
          <pub-id pub-id-type="doi">10.2307/25148670</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koo</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>MY</given-names>
            </name>
          </person-group>
          <article-title>A guideline of selecting and reporting intraclass correlation coefficients for reliability research</article-title>
          <source>J Chiropr Med</source>
          <year>2016</year>
          <month>06</month>
          <volume>15</volume>
          <issue>2</issue>
          <fpage>155</fpage>
          <lpage>163</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27330520"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jcm.2016.02.012</pub-id>
          <pub-id pub-id-type="medline">27330520</pub-id>
          <pub-id pub-id-type="pii">S1556-3707(16)00015-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC4913118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jacobson</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Follette</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Revenstorf</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Psychotherapy outcome research: methods for reporting variability and evaluating clinical significance</article-title>
          <source>Behav Ther</source>
          <year>1984</year>
          <month>09</month>
          <volume>15</volume>
          <issue>4</issue>
          <fpage>336</fpage>
          <lpage>352</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/S0005-7894(84)80002-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/s0005-7894(84)80002-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doak</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Doak</surname>
              <given-names>LG</given-names>
            </name>
            <name name-style="western">
              <surname>Friedell</surname>
              <given-names>GH</given-names>
            </name>
            <name name-style="western">
              <surname>Meade</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Improving comprehension for cancer patients with low literacy skills: strategies for clinicians</article-title>
          <source>CA Cancer J Clin</source>
          <year>1998</year>
          <volume>48</volume>
          <issue>3</issue>
          <fpage>151</fpage>
          <lpage>162</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/resolve/openurl?genre=article&#38;sid=nlm:pubmed&#38;issn=0007-9235&#38;date=1998&#38;volume=48&#38;issue=3&#38;spage=151"/>
          </comment>
          <pub-id pub-id-type="doi">10.3322/canjclin.48.3.151</pub-id>
          <pub-id pub-id-type="medline">9594918</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chinn</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McGuirt</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Puri</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The readability of online patient education materials from major anesthesiology associations and the American Society of Anesthesiologists</article-title>
          <source>Open J Anesthesiol</source>
          <year>2014</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.4236/ojanes.2014.41001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dijanic</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelmalek</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sudah</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kerrigan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gorgy</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yalamanchili</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Readability assessment of patient educational materials for pediatric spinal deformity from top academic orthopedic institutions</article-title>
          <source>Spine Deform</source>
          <year>2022</year>
          <month>11</month>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>1315</fpage>
          <lpage>1321</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35819724"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s43390-022-00545-1</pub-id>
          <pub-id pub-id-type="medline">35819724</pub-id>
          <pub-id pub-id-type="pii">10.1007/s43390-022-00545-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC9579064</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dihan</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Chauhan</surname>
              <given-names>MZ</given-names>
            </name>
            <name name-style="western">
              <surname>Eleiwa</surname>
              <given-names>TK</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Sallam</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Khouri</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Elhusseiny</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Using large language models to generate educational materials on childhood glaucoma</article-title>
          <source>Am J Ophthalmol</source>
          <year>2024</year>
          <month>09</month>
          <volume>265</volume>
          <fpage>28</fpage>
          <lpage>38</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ajo.2024.04.004</pub-id>
          <pub-id pub-id-type="medline">38614196</pub-id>
          <pub-id pub-id-type="pii">S0002-9394(24)00144-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Guizar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Avetisian</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Abdou</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Karakash</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gallo</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Alluri</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Hah</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Safaee</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the accuracy and readability of ChatGPT in addressing patient queries on adult spinal deformity surgery</article-title>
          <source>Global Spine J</source>
          <year>2025</year>
          <month>07</month>
          <day>11</day>
          <fpage>21925682251360655</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/21925682251360655?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/21925682251360655</pub-id>
          <pub-id pub-id-type="medline">40643892</pub-id>
          <pub-id pub-id-type="pmcid">PMC12254131</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rudolph</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Daugherty</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Bloom's taxonomy in health professions education: associations with exam scores, clinical reasoning, and instructional effectiveness</article-title>
          <source>Curr Pharm Teach Learn</source>
          <year>2025</year>
          <month>11</month>
          <volume>17</volume>
          <issue>11</issue>
          <fpage>102444</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.cptl.2025.102444"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cptl.2025.102444</pub-id>
          <pub-id pub-id-type="medline">40695205</pub-id>
          <pub-id pub-id-type="pii">S1877-1297(25)00165-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Clinical performance and communication skills of ChatGPT versus physicians in emergency medicine: simulated patient study</article-title>
          <source>JMIR Med Inform</source>
          <year>2025</year>
          <month>07</month>
          <day>17</day>
          <volume>13</volume>
          <fpage>e68409</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2025/1/e68409/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/68409</pub-id>
          <pub-id pub-id-type="medline">40674718</pub-id>
          <pub-id pub-id-type="pii">v13i1e68409</pub-id>
          <pub-id pub-id-type="pmcid">PMC12289221</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ouyang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>She</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT's role in alleviating anxiety in total knee arthroplasty consent process: a randomized controlled trial pilot study</article-title>
          <source>Int J Surg</source>
          <year>2025</year>
          <month>03</month>
          <day>01</day>
          <volume>111</volume>
          <issue>3</issue>
          <fpage>2546</fpage>
          <lpage>2557</lpage>
          <pub-id pub-id-type="doi">10.1097/JS9.0000000000002223</pub-id>
          <pub-id pub-id-type="medline">39903546</pub-id>
          <pub-id pub-id-type="pii">01279778-990000000-02142</pub-id>
          <pub-id pub-id-type="pmcid">PMC12372728</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akdogan</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Uyar</surname>
              <given-names>GC</given-names>
            </name>
            <name name-style="western">
              <surname>Yesilbas</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Baskurt</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Malkoc</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Ozdemir</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Yazici</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Oksuzoglu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Uner</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ozet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sutcuoglu</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Effect of a ChatGPT-based digital counseling intervention on anxiety and depression in patients with cancer: a prospective, randomized trial</article-title>
          <source>Eur J Cancer</source>
          <year>2025</year>
          <month>05</month>
          <day>15</day>
          <volume>221</volume>
          <fpage>115408</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ejca.2025.115408</pub-id>
          <pub-id pub-id-type="medline">40215593</pub-id>
          <pub-id pub-id-type="pii">S0959-8049(25)00189-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>ACY</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>KTY</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>WWT</given-names>
            </name>
            <name name-style="western">
              <surname>Mak</surname>
              <given-names>WWS</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness of topic-based chatbots on mental health self-care and mental well-being: randomized controlled trial</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>04</month>
          <day>30</day>
          <volume>27</volume>
          <fpage>e70436</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e70436/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/70436</pub-id>
          <pub-id pub-id-type="medline">40306635</pub-id>
          <pub-id pub-id-type="pii">v27i1e70436</pub-id>
          <pub-id pub-id-type="pmcid">PMC12079066</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Su</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kostenko</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Schmid</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>DeMaria</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Villa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Swarup</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weida</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tuuli</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>Chatbot for patient education for prenatal aneuploidy testing: a multicenter randomized controlled trial</article-title>
          <source>Patient Educ Couns</source>
          <year>2025</year>
          <month>02</month>
          <volume>131</volume>
          <fpage>108557</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0738-3991(24)00424-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2024.108557</pub-id>
          <pub-id pub-id-type="medline">39642634</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(24)00424-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Milne-Ives</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>de Cock</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Shehadeh</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>de Pennington</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mole</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Normando</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Meinert</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The effectiveness of artificial intelligence conversational agents in health care: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>10</month>
          <day>22</day>
          <volume>22</volume>
          <issue>10</issue>
          <fpage>e20346</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/10/e20346/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/20346</pub-id>
          <pub-id pub-id-type="medline">33090118</pub-id>
          <pub-id pub-id-type="pii">v22i10e20346</pub-id>
          <pub-id pub-id-type="pmcid">PMC7644372</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McMahon</surname>
              <given-names>HV</given-names>
            </name>
            <name name-style="western">
              <surname>McMahon</surname>
              <given-names>BD</given-names>
            </name>
          </person-group>
          <article-title>Automating untruths: ChatGPT, self-managed medication abortion, and the threat of misinformation in a post-Roe world</article-title>
          <source>Front Digit Health</source>
          <year>2024</year>
          <volume>6</volume>
          <fpage>1287186</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38419805"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fdgth.2024.1287186</pub-id>
          <pub-id pub-id-type="medline">38419805</pub-id>
          <pub-id pub-id-type="pmcid">PMC10900507</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ponzo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Goitre</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Favaro</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Merlo</surname>
              <given-names>FD</given-names>
            </name>
            <name name-style="western">
              <surname>Mancino</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Riso</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bo</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Is ChatGPT an effective tool for providing dietary advice?</article-title>
          <source>Nutrients</source>
          <year>2024</year>
          <month>02</month>
          <day>06</day>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>469</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=nu16040469"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/nu16040469</pub-id>
          <pub-id pub-id-type="medline">38398794</pub-id>
          <pub-id pub-id-type="pii">nu16040469</pub-id>
          <pub-id pub-id-type="pmcid">PMC10892804</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dhar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kothari</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Vasquez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Maroda</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McClain</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Sheyn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tuliszewski</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Rangarajan</surname>
              <given-names>SV</given-names>
            </name>
          </person-group>
          <article-title>The utility and accuracy of ChatGPT in providing post-operative instructions following tonsillectomy: a pilot study</article-title>
          <source>Int J Pediatr Otorhinolaryngol</source>
          <year>2024</year>
          <month>04</month>
          <volume>179</volume>
          <fpage>111901</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijporl.2024.111901</pub-id>
          <pub-id pub-id-type="medline">38447265</pub-id>
          <pub-id pub-id-type="pii">S0165-5876(24)00055-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abreu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murimwa</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Farah</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sweetenham</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zeh</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Polanco</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>Enhancing readability of online patient-facing content: the role of AI chatbots in improving cancer information accessibility</article-title>
          <source>J Natl Compr Canc Netw</source>
          <year>2024</year>
          <month>05</month>
          <day>15</day>
          <volume>22</volume>
          <issue>2 D</issue>
          <fpage>e237334</fpage>
          <pub-id pub-id-type="doi">10.6004/jnccn.2023.7334</pub-id>
          <pub-id pub-id-type="medline">38749478</pub-id>
          <pub-id pub-id-type="pii">e237334</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wah</surname>
              <given-names>JNK</given-names>
            </name>
          </person-group>
          <article-title>Revolutionizing e-health: the transformative role of AI-powered hybrid chatbots in healthcare solutions</article-title>
          <source>Front Public Health</source>
          <year>2025</year>
          <volume>13</volume>
          <fpage>1530799</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fpubh.2025.1530799"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2025.1530799</pub-id>
          <pub-id pub-id-type="medline">40017541</pub-id>
          <pub-id pub-id-type="pmcid">PMC11865260</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lambert</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Scoping review of the preferences of older adults for patient education materials</article-title>
          <source>Patient Educ Couns</source>
          <year>2023</year>
          <month>03</month>
          <volume>108</volume>
          <fpage>107591</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.pec.2022.107591"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2022.107591</pub-id>
          <pub-id pub-id-type="medline">36584555</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(22)00875-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Şahin</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Topkaç</surname>
              <given-names>Erdem Can</given-names>
            </name>
            <name name-style="western">
              <surname>Doğan</surname>
              <given-names>Ç</given-names>
            </name>
            <name name-style="western">
              <surname>Şeramet</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Özcan</surname>
              <given-names>Rıdvan</given-names>
            </name>
            <name name-style="western">
              <surname>Akgül</surname>
              <given-names>Murat</given-names>
            </name>
            <name name-style="western">
              <surname>Yazıcı</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Still using only ChatGPT? The comparison of five different artificial intelligence chatbots' answers to the most common questions about kidney stones</article-title>
          <source>J Endourol</source>
          <year>2024</year>
          <month>11</month>
          <volume>38</volume>
          <issue>11</issue>
          <fpage>1172</fpage>
          <lpage>1177</lpage>
          <pub-id pub-id-type="doi">10.1089/end.2024.0474</pub-id>
          <pub-id pub-id-type="medline">39212674</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Busch</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rueger</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>van Dijk</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Kader</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ortiz-Prado</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Makowski</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Saba</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hadamitzky</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kather</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Truhn</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cuocolo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Bressem</surname>
              <given-names>KK</given-names>
            </name>
          </person-group>
          <article-title>Current applications and challenges in large language models for patient care: a systematic review</article-title>
          <source>Commun Med (Lond)</source>
          <year>2025</year>
          <month>01</month>
          <day>21</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>26</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s43856-024-00717-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s43856-024-00717-2</pub-id>
          <pub-id pub-id-type="medline">39838160</pub-id>
          <pub-id pub-id-type="pii">10.1038/s43856-024-00717-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC11751060</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haltaufderheide</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ranisch</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The ethics of ChatGPT in medicine and healthcare: a systematic review on large language models (LLMs)</article-title>
          <source>NPJ Digit Med</source>
          <year>2024</year>
          <month>07</month>
          <day>08</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>183</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-024-01157-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-024-01157-x</pub-id>
          <pub-id pub-id-type="medline">38977771</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-024-01157-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC11231310</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pei</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Piao</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Using ChatGPT in nursing: scoping review of current opinions</article-title>
          <source>JMIR Med Educ</source>
          <year>2024</year>
          <month>11</month>
          <day>19</day>
          <volume>10</volume>
          <fpage>e54297</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mededu.jmir.org/2024/1/e54297/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/54297</pub-id>
          <pub-id pub-id-type="medline">39622702</pub-id>
          <pub-id pub-id-type="pii">v10i1e54297</pub-id>
          <pub-id pub-id-type="pmcid">PMC11611787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berşe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Akça</surname>
              <given-names>Kamile</given-names>
            </name>
            <name name-style="western">
              <surname>Dirgar</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kaplan Serin</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The role and potential contributions of the artificial intelligence language model ChatGPT</article-title>
          <source>Ann Biomed Eng</source>
          <year>2024</year>
          <month>02</month>
          <volume>52</volume>
          <issue>2</issue>
          <fpage>130</fpage>
          <lpage>133</lpage>
          <pub-id pub-id-type="doi">10.1007/s10439-023-03296-w</pub-id>
          <pub-id pub-id-type="medline">37378876</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10439-023-03296-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tilton</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Caplan</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Cole</surname>
              <given-names>BJ</given-names>
            </name>
          </person-group>
          <article-title>Generative AI in consumer health: leveraging large language models for health literacy and clinical safety with a digital health framework</article-title>
          <source>Front Digit Health</source>
          <year>2025</year>
          <volume>7</volume>
          <fpage>1616488</fpage>
          <pub-id pub-id-type="doi">10.3389/fdgth.2025.1616488</pub-id>
          <pub-id pub-id-type="medline">40933812</pub-id>
          <pub-id pub-id-type="pmcid">PMC12417475</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
