<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e62857</article-id>
      <article-id pub-id-type="pmid">40163853</article-id>
      <article-id pub-id-type="doi">10.2196/62857</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Ability of ChatGPT to Replace Doctors in Patient Education: Cross-Sectional Comparative Analysis of Inflammatory Bowel Disease</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Ma</surname>
            <given-names>Xiaomeng</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hidki</surname>
            <given-names>Asmaa</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pesälä</surname>
            <given-names>Samuli</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wu</surname>
            <given-names>Chaochen</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Yan</surname>
            <given-names>Zelin</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-3123-4875</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Jingwen</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5179-1592</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Fan</surname>
            <given-names>Yihong</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9554-0541</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Shiyuan</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2825-8244</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Dingting</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8728-2378</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Yun</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-3323-7569</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Honggang</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4761-0407</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Mao</surname>
            <given-names>Jie</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-9597-1249</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Tseng</surname>
            <given-names>Hou-Chiang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5249-7280</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Chang</surname>
            <given-names>Tao-Hsing</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4390-5021</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Yan</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Center of Inflammatory Bowel Diseases</institution>
            <institution>Department of Gastroenterology</institution>
            <institution>The Second Affiliated Hospital, Zhejiang University School of Medicine</institution>
            <addr-line>No 88, Jiefang Road</addr-line>
            <addr-line>Hangzhou, 310000</addr-line>
            <country>China</country>
            <fax>86 571 87783777</fax>
            <phone>86 13757118653</phone>
            <email>chenyan72_72@zju.edu.cn</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3457-2560</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Zhejiang Provincial Key Laboratory of Gastrointestinal Diseases Pathophysiology</institution>
        <institution>Department of Gastroenterology</institution>
        <institution>The First Affiliated Hospital of Zhejiang Chinese Medical University</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Center of Inflammatory Bowel Diseases</institution>
        <institution>Department of Gastroenterology</institution>
        <institution>The Second Affiliated Hospital, Zhejiang University School of Medicine</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>The China Crohn’s &#38; Colitis Foundation</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>The Clinical Medical College</institution>
        <institution>Zhejiang University School of Medicine</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Gastroenterology</institution>
        <institution>The Affiliated Huaian No.1 People’s Hospital of Nanjing Medical University</institution>
        <addr-line>Huai'an</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>The Second Clinical Medical College</institution>
        <institution>Zhejiang Chinese Medical University</institution>
        <addr-line>Hangzhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Graduate Institute of Digital Learning and Education</institution>
        <institution>National Taiwan University of Science and Technology</institution>
        <addr-line>Taipei</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Department of Computer Science and Information Engineering</institution>
        <institution>National Kaohsiung University of Science and Technology</institution>
        <addr-line>Kaohsiung</addr-line>
        <country>Taiwan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yan Chen <email>chenyan72_72@zju.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>31</day>
        <month>3</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e62857</elocation-id>
      <history>
        <date date-type="received">
          <day>3</day>
          <month>6</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>23</day>
          <month>9</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>11</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>19</day>
          <month>1</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Zelin Yan, Jingwen Liu, Yihong Fan, Shiyuan Lu, Dingting Xu, Yun Yang, Honggang Wang, Jie Mao, Hou-Chiang Tseng, Tao-Hsing Chang, Yan Chen. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 31.03.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e62857" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Although large language models (LLMs) such as ChatGPT show promise for providing specialized information, their quality requires further evaluation. This is especially true considering that these models are trained on internet text and the quality of health-related information available online varies widely.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to evaluate the performance of ChatGPT in the context of patient education for individuals with chronic diseases, comparing it with that of industry experts to elucidate its strengths and limitations.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This evaluation was conducted in September 2023 by analyzing the responses of ChatGPT and specialist doctors to questions posed by patients with inflammatory bowel disease (IBD). We compared their performance in terms of subjective accuracy, empathy, completeness, and overall quality, as well as readability to support objective analysis.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In a series of 1578 binary choice assessments, ChatGPT was preferred in 48.4% (95% CI 45.9%-50.9%) of instances. There were 12 instances where ChatGPT’s responses were unanimously preferred by all evaluators, compared with 17 instances for specialist doctors. In terms of overall quality, there was no significant difference between the responses of ChatGPT (3.98, 95% CI 3.93-4.02) and those of specialist doctors (3.95, 95% CI 3.90-4.00; <italic>t</italic><sub>524</sub>=0.95, <italic>P</italic>=.34), both being considered “good.” Although differences in accuracy (<italic>t</italic><sub>521</sub>=0.48, <italic>P</italic>=.63) and empathy (<italic>t</italic><sub>511</sub>=2.19, <italic>P</italic>=.03) lacked statistical significance, the completeness of textual output (<italic>t</italic><sub>509</sub>=9.27, <italic>P</italic>&#60;.001) was a distinct advantage of the LLM (ChatGPT). In the sections of the questionnaire where patients and doctors responded together (Q223-Q242), ChatGPT demonstrated inferior performance (<italic>t</italic><sub>36</sub>=2.91, <italic>P</italic>=.006). Regarding readability, no statistical difference was found between the responses of specialist doctors (median: 7th grade; Q1: 4th grade; Q3: 8th grade) and those of ChatGPT (median: 7th grade; Q1: 7th grade; Q3: 8th grade) according to the Mann-Whitney U test (<italic>P</italic>=.09). The overall quality of ChatGPT’s output exhibited strong correlations with other subdimensions (with empathy: <italic>r</italic>=0.842; with accuracy: <italic>r</italic>=0.839; with completeness: <italic>r</italic>=0.795), and there was also a high correlation between the subdimensions of accuracy and completeness (<italic>r</italic>=0.762).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>ChatGPT demonstrated more stable performance across various dimensions. Its output of health information content is more structurally sound, addressing the issue of variability in the information from individual specialist doctors. ChatGPT’s performance highlights its potential as an auxiliary tool for health information, despite limitations such as artificial intelligence hallucinations. It is recommended that patients be involved in the creation and evaluation of health information to enhance the quality and relevance of the information.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>AI-assisted</kwd>
        <kwd>patient education</kwd>
        <kwd>inflammatory bowel disease</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>ChatGPT</kwd>
        <kwd>patient communities</kwd>
        <kwd>social media</kwd>
        <kwd>disease management</kwd>
        <kwd>readability</kwd>
        <kwd>online health information</kwd>
        <kwd>conversational agents</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>In the medical field, large language models (LLMs), represented by ChatGPT, have shown significant application potential: In oncology, various brands of LLMs consistently generate relatively accurate and high-quality information, highlighting their potential as sources of medical information [<xref ref-type="bibr" rid="ref1">1</xref>]. From English to Chinese environments, LLMs have impressively passed their respective medical licensing exams, demonstrating their communication abilities in multilingual clinical settings and their foundational potential in medical education [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Whether the input text is everyday medical records or structured terminological reports, ChatGPT can swiftly interpret cues based on evidence-based guidelines, aiding health care providers in making informed decisions and showing significant potential in enhancing patient follow-up adherence [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. LLMs have showcased their “rich medical knowledge” and the ability to extract disease information from various languages and contexts. Their method of providing information in a “human-like” tone is considered more effective than traditional search engines [<xref ref-type="bibr" rid="ref7">7</xref>]. Despite a lack of evidence, these tools are being adopted by patients and clinical doctors [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. The reason behind their excellent performance is that their text training set comes from a vast amount of publicly available internet information, making the quality of medical information provided by LLMs comparable to existing internet information [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>Patients with chronic diseases themselves exhibit higher enthusiasm and realistic motivation in seeking health information and using web-based health technologies [<xref ref-type="bibr" rid="ref11">11</xref>]. Undoubtedly, as artificial intelligence (AI) applications become more widespread, an increasing number of patients will use this technology in practice, and the quality of health information can have a positive or negative impact on patients’ clinical outcomes [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. In the field of inflammatory bowel disease (IBD), the evaluation reports of health information, whether in Chinese or English, have been consistently mediocre, once deemed insufficient to meet patient needs [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. When emerging AI tools replace static traditional internet information, the impact on patient education and self-management requires careful consideration and evaluation.</p>
      <p>Including Crohn disease and ulcerative colitis, IBD is an increasingly prevalent chronic intestinal disease in China, characterized by primary invasion of the digestive system and cumulative multisystem involvement of autoimmune diseases, with no cure currently available. Patients have a strong need to learn and reinforce self-care abilities, among which the WeChat public account of the China Crohn’s and Colitis Foundation (CCCF) is the most popular with IBD patients [<xref ref-type="bibr" rid="ref19">19</xref>]. We used it as a representative to study the patient education ecosystem for chronic diseases.</p>
      <p>This study aimed to evaluate ChatGPT’s ability to provide specialized vertical domain information, especially in the education of some patients with chronic disease, and compare it with industry experts. Through this comparison, we can identify the strengths and limitations of LLMs in medical information services, providing a basis for further improvement and application of the technology. Additionally, this study aimed to enhance the public and medical professionals’ awareness and acceptance of using AI tools in medical information acquisition and education.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Collection of Questions and the Original Doctor Responses</title>
        <p>The mode of one-on-one question-and-answer dialogue stands as a prevalent form of interaction within the health care domain. Across various medical applications, online forums, and instant messaging groups, a substantial portion of queries manifest as repetitive and amenable to categorization.</p>
        <p>In earlier epochs, we undertook the aggregation of high-frequency, prototypical questions posed by patients with IBD through online platforms and outpatient settings. We extended invitations to industry peers to collectively address these patient queries, culminating in the publication of a didactic tome titled “Q&#38;A on Ulcerative Colitis and Crohn’s Disease” tailored for the self-learning of individuals with inflammatory bowel ailments. This publication reflects the cumulative outcomes of doctor-patient interactions over 7 years at the CCCF and the Second Affiliated Hospital-Zhejiang University School of Medicine IBD Center encompassing 9000 cases. The compendium was predominantly curated by 8 seasoned IBD specialist doctors, with contributions from 55 IBD practitioners and 5 experienced patients with a high level of cultural acumen. Upon its publication, the book garnered commendations and accolades from numerous esteemed figures within the IBD community in China and the United States. The content delves into various aspects of IBD, including etiology, symptoms, diagnosis, treatment, follow-up protocols, and emotional support. The questions encapsulated within are highly representative and encompass a broad spectrum (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Many analogous questions have surfaced on pertinent social media platforms, with the content of this tome serving as a primary source of representative patient inquiries. Presently, the book has undergone 9 printings, with a distribution nearing 20,000 copies.</p>
        <p>The thematic essence of the book comprises 263 distinct questions matched with corresponding responses from doctors. Apart from a minor subset of emotional support content provided by patients, all responses are underpinned by evidence-based rationale. This sample size is anticipated to afford us a statistical power of 90% to discern a 10% differential between responses generated by ChatGPT and those proffered by medical practitioners (55% vs 45%; <xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Schematic of operational workflow. CRIE: Chinese Readability Index Explorer; IBD: inflammatory bowel disease.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e62857_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>To enhance the transparency and reproducibility of the experimental results, we did not use anonymized online medical consultation text for doctor-patient interactions. The content in the book was derived from authentic doctor-patient interactions, pre-authorized and publicly disclosed, with many excerpts being republished on social media platforms in electronic format [<xref ref-type="bibr" rid="ref20">20</xref>]. The data used in this study are publicly available and do not contain any identifiable personal information.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>Based on the assessment by the ethics committee, considering the nature and purpose of the research materials, as well as the practices in prior similar studies, it was determined that this study did not involve direct research on human participants and ultimately did not require ethical review [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. The content is used under authorization and license from Zhejiang University Press.</p>
      </sec>
      <sec>
        <title>Collecting ChatGPT Responses</title>
        <p>In the period from September 8, 2023, to September 22, 2023, ChatGPT responses were collected by inputting the original question text into a new chatbot session (GPT-3.5 version, OpenAI, August 3 version, 2023) and saving the chatbot replies [<xref ref-type="bibr" rid="ref24">24</xref>]. Differing from some other experimental methodologies, we adopted a sequential prompting of all questions listed in the directory within the same bot link [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. The rationale behind this approach includes the following.</p>
        <p>First, the original questions in the book contained terminology descriptions presumed to be familiar and comprehensible to health care professionals; for instance, in Chinese, the term [激素] “hormone” in the book and in IBD doctor-patient communication scenarios often specifically refers to [糖皮质激素] “glucocorticoids.” In a typical context, using [激素] “hormone” in communication may commonly lead individuals to think of “chemical messengers between cells,” and according to LLM principles, ChatGPT would respond to the latter in the absence of contextual elucidation. This measure was taken to mitigate the potential for the bot to provide accurate “incorrect responses” due to a lack of contextual background.</p>
        <p>Second, upon encountering the instances of the bot misinterpreting the language context, we continued to supplement vocabulary prompts to guide ChatGPT in understanding the true intent of the questioner, thereby eliciting a response that aligned with it. However, prompts were limited to no more than 3 times, drawing from the routine search habits of patients on the web and previous experiments [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref25">25</xref>].</p>
        <p>Third, to emulate the habitual reading practices and context of normal situations, we posed questions to ChatGPT in the same sequential order as presented in the book.</p>
      </sec>
      <sec>
        <title>Quality Control</title>
        <p>First, the final analytic sample encompassed 263 questions and their corresponding responses from doctors and ChatGPT, as featured in the ninth edition of “Q&#38;A on Ulcerative Colitis and Crohn’s Disease” printed in April 2022. Responses from doctors were designated as the benchmark.</p>
        <p>Second, some original responses in the book were provided by patients, and we retained this text, as it had undergone professional medical review before the book’s publication. It can be understood that, although drafted by patient volunteers, the expressions were approved by doctors and deemed suitable for new patients to view, primarily addressing psychological issues (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p>
        <p>Third, original illustrations from the book were not excerpted, whereas tables were permitted. This decision was made because, when using ChatGPT, the model itself could generate tables, thus remaining unaffected.</p>
        <p>Fourth, at that time, the version of ChatGPT would randomly present 2 response options for user selection when prompted, with the first option being the default choice.</p>
        <p>Fifth, due to network issues, in the event of a crash or incomplete display, we would click “regenerate” once to select a complete text answer for material completion.</p>
      </sec>
      <sec>
        <title>Text Content Evaluation </title>
        <sec>
          <title>Subjective Assessment </title>
          <p>The assessment was conducted by 6 evaluators (3 licensed IBD doctors and 3 IBD patients). The doctors were experienced IBD physicians in patient education (YC, DX, HW), with over 10 years of clinical experience, having treated more than 500 patients with IBD, and engaged in patient education for over 5 years. The patient characteristics required were individuals aged between 20 years and 60 years, with at least an undergraduate education level, diagnosed with IBD for more than a year, and who had not read the “Questions and Answers” book. To ensure evaluators were as unable as possible to distinguish the source of the text, we used a blind method when presenting the materials to evaluators, concealing explanatory language such as “as an artificial intelligence.” The doctors’ responses and ChatGPT responses for the same question were anonymized and randomly labeled as Response 1 and Response 2. Evaluators were required to first read the question along with the corresponding doctors’ responses and ChatGPT response, followed by a 2-step evaluation process: (1) selecting the preferred answer version and (2) subjectively rating the 2 answers on a 5-point Likert scale for overall quality and dimensional evaluation, referencing dimensions from previous health information research [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>], including accuracy, empathy, and completeness. A higher score indicates greater evaluator approval of the response text’s performance in that dimension (see <xref ref-type="table" rid="table1">Table 1</xref> for details).</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Definitions of each dimension and pretraining required for evaluators.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="150"/>
              <col width="850"/>
              <thead>
                <tr valign="top">
                  <td>Dimension</td>
                  <td>Definition</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Accuracy</td>
                  <td>Whether the response scientifically and impartially explains the issue, such as providing explanations on medication use and dosage, and clarifies surgical timing limitations</td>
                </tr>
                <tr valign="top">
                  <td>Completeness</td>
                  <td>Whether there are any omissions of important information or concepts in the explanation</td>
                </tr>
                <tr valign="top">
                  <td>Empathy</td>
                  <td>Whether the response demonstrates an understanding of the question from the perspective of the “patient” or the inquirer</td>
                </tr>
                <tr valign="top">
                  <td>Overall quality</td>
                  <td>Subjective perception of the overall quality of the text</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
        <sec>
          <title>Objective Evaluation</title>
          <p>The Chinese Readability Index Explorer (CRIE; version 3.0 [<xref ref-type="bibr" rid="ref26">26</xref>]) was used. In addition to the evaluators’ subjective assessments, we introduced a quantitative Chinese readability tool, CRIE. It consists of 4 subsystems comprising 82 multilevel language features [<xref ref-type="bibr" rid="ref27">27</xref>]. CRIE uses multilevel language features for text analysis, including vocabulary, syntax, semantics, and cohesion. This tool aids with analyzing various types of texts, such as Chinese textbooks [<xref ref-type="bibr" rid="ref28">28</xref>], foreign language learning materials [<xref ref-type="bibr" rid="ref29">29</xref>], and domain-specific knowledge texts [<xref ref-type="bibr" rid="ref30">30</xref>]. Numerous studies have validated its reliability and practicality in the Chinese health domain [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Results can be interpreted using the Flesch-Kincaid English readability assessment method: the higher the grade, the greater the text complexity. Quantitative natural language processing and text mining tools serve as valuable supplements to subjective human evaluations [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>Data Statistics and Analysis</title>
        <sec>
          <title>Data Aggregation</title>
          <p>Aligned with the research objectives, we used a crowdsourced scoring strategy for data collection, a method that aggregates data across a collective of evaluators. Primarily applied in the field of linguistics, where language use is a fundamental domain for the general populace, the central idea is to harness the collective expertise of both experts and the public to pioneer new concepts through crowd annotations. This method is well-suited for subjective evaluations, such as scoring of singing by judges or the exploration of novel concepts. Calculating average scores for each dimension reflects the consistency variances among evaluators, encapsulating individual uncertainties and subjective biases within the variance of the scores [<xref ref-type="bibr" rid="ref21">21</xref>]. In the context of health text evaluation, the involvement of judges and the assessment method, involving direct quantification by both IBD health care providers and consumers, represents a feasible, efficient, cost-effective, and relatively accessible evaluation strategy.</p>
        </sec>
        <sec>
          <title>Primary Outcomes</title>
          <p>We conducted descriptive analysis and assessed evaluators’ preference ratios for ChatGPT using a chi-square goodness-of-fit test. A 2-tailed Welch <italic>t</italic> test was used to compare the mean values of the 2 responses. We defined a threshold score of 3 (acceptable) and calculated the proportion exceeding or falling below this threshold score (3), comparing them using prevalence ratios. Furthermore, we evaluated the Pearson correlation coefficients between the various subdimensions of quality to observe or predict correlations between different dimensions. Given that the readability of each response text is a calculated ordinal variable, nonparametric tests were used for comparison.</p>
        </sec>
        <sec>
          <title>Secondary Outcomes</title>
          <p>Subgroup <italic>t</italic> test analyses were conducted to assess the impact of evaluator identity (physician/patient) and the original response creator’s source (solely doctor/doctor-patient collaboration) on mean scores.</p>
          <p>A significance level of <italic>P</italic>&#60;.05 was set, and Bonferroni correction was applied for multiple tests. All statistical analyses were performed using R software (version 4.3.1 GUI 1.79 Big Sur ARM build) and RStudio (version 2023.09.1+494). Data visualization was created based on code references from the open-source platform Hiplot.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Preferred Response Ratio</title>
        <p>Of 1578 evaluations, evaluators showed a preference for ChatGPT responses at a rate of 48.4% (95% CI 45.9%-50.9%; <italic>P</italic>=.20). Among these, 6 evaluators exclusively favored ChatGPT responses for a total of 12 questions: 22, 28, 42, 56, 73, 120, 121, 124, 127, 161, 174, 195. Evaluators exclusively favored doctors’ responses for 17 questions: 5, 27, 41, 83, 85, 92, 156, 175, 180, 198, 205, 210, 219, 234, 237, 251, 263. The questions and corresponding responses from both doctors and the AI model are detailed in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
      </sec>
      <sec>
        <title>Comparison of Mean Scores and Prevalence Ratio of Threshold Scores</title>
        <p>Overall, the proportion of responses rated below an acceptable quality (&#60;3) was 1.26 times higher for doctors’ responses than for ChatGPT responses (doctors: 3.3%, 95% CI 2.5%-4.4%; ChatGPT: 2.7%, 95% CI 1.9%-3.5%). Simultaneously, the proportion of responses rated as good or very good quality was 1.10 times higher for ChatGPT than for doctors (doctors: 69.4%, 95% CI 67.1%-71.7%; ChatGPT: 76%, 95% CI 73.7%-78%). Although ChatGPT had a slight advantage in the overall quality distribution, there was no significant difference between ChatGPT and doctors’ responses (t<sub>524</sub>=0.95, <italic>P</italic>=.34), with doctors’ (3.95, 95% CI 3.90-4.00) and ChatGPT responses (3.98, 95% CI 3.93-4.02) both rated at a “good” level.</p>
        <p>In terms of the completeness dimension, ChatGPT responses significantly outperformed doctors’ responses (t<sub>509</sub>=9.27, <italic>P</italic>&#60;.001), although both doctors’ responses (3.88, 95% CI 3.83-3.94) and ChatGPT responses (4.21, 95% CI 4.17-4.26) were rated at a “good” level. The proportion of low completeness responses was 3.66 times higher for doctors’ responses (6.7%, 95% 5.53%-8.97%) than for ChatGPT responses (1.8%, 95% CI 1.2%-2.6%); the proportion of high completeness responses was 1.20 times higher for ChatGPT responses (81.1%, 95% CI 79.2%-83.1%) than for doctors’ responses (67.4%, 95% CI 65.1%-69.7%). Pretrained models and structured outputs contributed to ChatGPT receiving more favor in this dimension.</p>
        <p>In the empathy dimension, ChatGPT responses were inferior to doctors’ responses (t<sub>511</sub>=2.19, <italic>P</italic>=.03). Due to the significance correction for multiple tests, we conservatively state that there is no significant difference between doctors’ responses (3.99, 95% CI 3.95-4.03) and ChatGPT responses (4.06, 95% 4.01-4.11). The proportion of low empathy responses was 1.12 times higher for ChatGPT responses (2.8%, 95% CI 2%-3.7%) than for doctors’ responses (2.5%, 95% 1.8%-3.4%), while the proportion of high empathy responses was 1.04 times higher for ChatGPT responses (75%, 95% CI 72.8%-77.1%) than for doctors’ responses (72%, 95% CI 69.6%-74.1%).</p>
        <p>In the accuracy dimension, there was not a significant difference between ChatGPT and doctors’ responses (t<sub>521</sub>=0.48, <italic>P</italic>=.63). Doctors’ responses (4.11, 95% CI 4.07-4.15) and ChatGPT responses (4.12, 95% CI 4.08-4.17) were comparable. The proportion of low accuracy responses was 2.2 times higher for ChatGPT responses (2.4%, 95% CI 1.7%-3.3%) than for doctors’ responses (1.1%, 95% CI 0.6%-1.7%), while the proportion of high-accuracy responses was 1.05 times higher for ChatGPT responses (81.1%, 95% CI 79%-83%) than for doctors’ responses (76.9%, 95% CI 74.7%-78.9%).</p>
      </sec>
      <sec>
        <title>Subgroup Comparisons</title>
        <sec>
          <title>Discrepancies in Evaluator Perspectives</title>
          <p>In terms of overall quality, physicians (<italic>P</italic>=.09) and patients (<italic>P</italic>=.88) perceived no difference between ChatGPT and doctors (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Regarding completeness, physicians (t<sub>524</sub>=7.7, <italic>P</italic>&#60;.001) and patients (t<sub>508</sub>=8.0, <italic>P</italic>&#60;.001) unanimously agreed that ChatGPT outperformed doctors. On the empathy dimension, although physicians (t<sub>523</sub>=0.38, <italic>P</italic>=.70) did not perceive a difference between the two, patients believed that doctors’ responses exhibited more emotional depth than ChatGPT (t<sub>503</sub>=2.9, <italic>P</italic>=.003). In terms of accuracy, physicians (t<sub>496</sub>=2.3, <italic>P</italic>=.02) considered doctors’ responses to be more accurate, while patients believed that ChatGPT responses held a slight edge in accuracy (t<sub>520</sub>=3.3, <italic>P</italic>&#60;.001).</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Kernel density plot illustrating the overall quality assessment by (A) physicians and (B) patients, completeness assessment by (C) physicians and (D) patients, empathy assessment by (E) physicians and (F) patients, and accuracy assessment by (G) physicians and (H) patients.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e62857_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Differences in Responders' Performance</title>
          <p>We selected original questions (Q223-Q242) for which patients assisted doctors in crafting responses and found that, in this subset, doctors’ performance significantly surpassed that of ChatGPT (<italic>t</italic><sub>df</sub>=2.9, <italic>P</italic>=.006; <xref rid="figure3" ref-type="fig">Figure 3</xref>). In terms of overall quality and across various dimensions (<xref rid="figure4" ref-type="fig">Figure 4</xref>), ChatGPT’s ability to curate health information in the specialized field of medicine is now on par with professional doctors, reaching a level of excellence.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Kernel density plot of the overall quality of the (A) original questions (Q223-Q242) for which patients assisted doctors in crafting responses and (B) all responses.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e62857_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Kernel density plots showing assessors’ evaluations of (A) accuracy, (B) empathy, (C) completeness, and (D) overall quality.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e62857_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Subdimension Correlation Analysis</title>
        <p>Using Pearson tests, a correlation analysis was conducted on the scores of ChatGPT responses across different text dimensions, revealing strong correlations between overall quality and other subdimensions (with empathy: r=0.842; with accuracy: r=0.839; with completeness: r=0.795). Additionally, there was a high correlation between accuracy and completeness among subdimensions (r=0.762; <xref rid="figure5" ref-type="fig">Figure 5</xref>). Similar patterns were observed in text responses from doctors, where overall quality exhibited correlations with completeness (r=0.857), with empathy (r=0.849), and with accuracy (0.828), and a correlation existed between accuracy and completeness (r=0.785; <xref rid="figure6" ref-type="fig">Figure 6</xref>).</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Correlation analysis of ChatGPT responses.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e62857_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Correlation analysis of doctors' responses.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e62857_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Readability Analysis</title>
        <p>A Mann-Whitney <italic>U</italic> test on the readability of responses from doctors (median: 7th grade; 1st quartile: 4th grade; 3rd quartile: 8th grade) and ChatGPT (median: 7th grade; 1st quartile: 7th grade; 3rd quartile: 8th grade) revealed no significant difference (<italic>P</italic>=.09; <xref rid="figure7" ref-type="fig">Figure 7</xref>).</p>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>An accordion plot illustrating significant fluctuations in the text editing abilities of the original doctors’ responses (median: 7th grade; 1st quarter: 4th grade; 3rd quarter: 8th grade).</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e62857_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We introduced relatively novel methodologies and tools to form a viable framework for health information assessment. This cross-sectional study hypothesized that, in vertical fields like IBD, foundational LLMs such as ChatGPT-3.5 can perform comparably to domain experts in drafting health information and educating patients. Preliminary results suggest that using AI to assist with drafting or refining educational materials in patient education and popular science scenarios outside clinical consultations holds significant potential. This approach can address the challenges of limited physician time or expertise and bridge the gap of static information failing to meet the needs of patients with IBD. However, due to the current inability to eliminate AI hallucination phenomena, no matter how well LLMs perform, it is crucial to avoid unsupervised direct integration into patient care processes.</p>
      </sec>
      <sec>
        <title>Stable and Comprehensive: ChatGPT’s Health Information Output Capability</title>
        <p>High-quality health information contributes to favorable medical outcomes, especially for patients with chronic conditions [<xref ref-type="bibr" rid="ref12">12</xref>]. Conversely, erroneous, incomplete, and unregulated information may mislead patients into making detrimental choices [<xref ref-type="bibr" rid="ref13">13</xref>]. Exploring the application of LLMs in health information retrieval and chronic disease patient education holds significant practical relevance.</p>
        <p>Although the selection ratio did not exceed that of doctors to a statistically significant level, it is important to note that the latter are highly specialized professionals in the field of Chinese IBD and are endorsed by the expert association (Chinese IBD board) that follows them.</p>
        <p>However, ChatGPT’s responses are more comprehensive. From a selection of 12 fully optimized ChatGPT responses (partially referenced in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>), the advantages of ChatGPT are evident. Moreover, in the 5-level Likert scale evaluation, it significantly outperformed human experts. This stems from GPT’s structured approach based on preset models, featuring a brief introductory paragraph, followed by a list of answers with bullet points or numbering, and a standard concluding paragraph. In terms of accuracy and empathy, there were no significant differences between the two; however, there was a significant disparity in the completeness of responses between humans and GPT. Previous studies have found that GPT provides appropriate and easily understandable answers to questions regarding diagnosis and treatment choices but falls short when it comes to explaining diagnostic tests and recommending complex management strategies [<xref ref-type="bibr" rid="ref7">7</xref>]. Although its responses are structurally sound, they often lack critical insights into decision thresholds and treatment timing [<xref ref-type="bibr" rid="ref23">23</xref>]. Our IBD specialist physician (YC) provided a sharp critique: Its answers are superficial and lack sensitivity and understanding of medication efficacy and monitoring time frames. Interestingly, despite our blind randomized process, 2 evaluators admitted toward the end of the experiment that they could discern distinctly different styles between the 2 groups. Our study does not seem to support ChatGPT’s tendency to offer technically correct but insufficient textual conclusions [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <p>From various visual distribution charts (<xref rid="figure2" ref-type="fig">Figures 2</xref>, 3, 4, and 6), it is evident that ChatGPT exhibits less score variance, indicating a more stable performance in this dimension. If you have ever coordinated a large group of people, compiling group publications and information without being able to control the format, you would deeply appreciate the commendable ability of LLMs in this regard. With an equal amount of learning material provided, machines produce more consistent outputs than humans.</p>
      </sec>
      <sec>
        <title>How to Make Others Understand (Whether They Are LLMs or Patients)</title>
        <p>In its official description, ChatGPT is merely a language model, pretrained for general cognitive tasks [<xref ref-type="bibr" rid="ref10">10</xref>]. Its performance may decrease when faced with tasks that require specialized and highly professional skills. Subsequent strategies include (1) using secondary LLMs tailored for various professional scenarios, such as Med-PalM [<xref ref-type="bibr" rid="ref33">33</xref>], and (2) application of prompt engineering.</p>
        <p>Prompt engineering, a concept that combines artistry and science [<xref ref-type="bibr" rid="ref10">10</xref>], led to a sudden realization in our experimental design, respecting the working principles of ChatGPT. LLMs are based on large-scale learning, reflecting the collective knowledge level of most learnable materials, implying that its understanding of information is based on widely applicable domains. However, our questions were based on the IBD community, sourcing information from a vertically specialized field. Specific contexts give rise to “slang” and a plethora of “terminology.” Broadly speaking, ChatGPT interpreting [激素] “hormones” as “chemical messengers between cells” is the most accurate, as outside of clinical contexts, such abbreviations are rarely used. When faced with unsatisfactory responses or doubts about AI hallucination, consider first whether the prompts (terminology) you provide as the initiating party have been broken down for laypersons to understand. In previous evaluations of English and Chinese IBD information [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref34">34</xref>], the readability levels of web health information were generally too high, making them unsuitable for public dissemination [<xref ref-type="bibr" rid="ref14">14</xref>]. Simultaneously, there are also articles indicating that the English output generated by ChatGPT is at a university level [<xref ref-type="bibr" rid="ref9">9</xref>]. This aligns with the common complaint heard by the authors in work settings from patients: Doctors chatter on, but I can’t understand a word they're saying. Explaining one term with another is not a joke but a satirical reality.</p>
        <p>In English health information research, readability analysis is commonplace. Common assessment tools include the Flesch-Reading Ease score and Flesch-Kincaid Grade Level [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. However, the analysis and application of Chinese readability are still in their infancy. We hope to see more experts from various industries, not just health care professionals, participate in such research and recognize the importance of information and its potential power. The popularity of “Q&#38;A on Ulcerative Colitis and Crohn's Disease” in the IBD community remains inexplicable, but we speculate that its readability matches the general educational levels of the Chinese population and the recommended grade level for popular science publications [<xref ref-type="bibr" rid="ref35">35</xref>]. Additionally, it is pleasantly surprising that the Chinese readability of ChatGPT’s response information is also very good, showing no significant difference from the level of professional doctors and exhibiting greater stability (narrower kernel density variance).</p>
        <p>In the cross-sectional comparison of subdimensions, we observed strong correlations between the overall quality of health information and completeness, accuracy, and empathy. Furthermore, there was a high predictive function between completeness and accuracy, as depicted in <xref rid="figure5" ref-type="fig">Figures 5</xref> and <xref rid="figure6" ref-type="fig">6</xref>, with a “more words, more reason” phenomenon. This same trend is confirmed in sensitivity analysis [<xref ref-type="bibr" rid="ref21">21</xref>]. Although each aspect can enhance the persuasiveness of textual information, empathy as an emotional dimension is not strongly correlated with rational dimensions such as accuracy and completeness.</p>
      </sec>
      <sec>
        <title>Disparities in Cognitive Understanding Between Patients and Health Care Providers</title>
        <p>In the overall comprehension of quality and completeness, it is evident that there was no disagreement among assessors in the roles of health care providers and patients. Both parties unanimously considered ChatGPT and medical experts to perform similarly, with the former providing more comprehensive information. However, upon conducting subgroup analysis, we discovered that health care providers have a delayed grasp on empathy and are more sensitive to accuracy. Health care providers can discern more accurately sourced information from their peers, while patients may not. These disparities form the foundation for the communication conflicts between health care providers and patients in real-life scenarios. Patients may not perceive ChatGPT’s information to be more erroneous than that of medical professionals, possibly due to their lack of professional knowledge to comprehend the underlying facts. This mirrors the headache-inducing situation for health care providers when patients prefer to believe exaggerated television advertisements for health products rather than opting for industry-reviewed experts and guidelines. This serves as a reminder that medical and health information must be developed and tested with patients (consumers) at the center [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>AI Hallucination</title>
        <p>Errors in responses from LLMs are referred to as “AI hallucination,” and chatbots typically present themselves in a convincing manner, leading the inquirer to potentially believe in their authenticity [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. We believe this is also a key reason why patient assessors cannot differentiate between the accuracy of ChatGPT and medical experts.</p>
        <p>Despite emphasizing the importance of prompt engineering, we are still amazed by ChatGPT’s ability to identify spelling errors, ambiguities, and highly condensed issues, based on our experimental responses structured as progressive inquiries following textbook content. As feedback, ChatGPT even comprehends outdated drug translations (eg, the new official translation [英夫利西单抗] for “infliximab” and the old term [英孚利昔单抗]). It also gave us a few “AI hallucinations” (correspondingly, numerous poorly performing outliers are evident in <xref rid="figure8" ref-type="fig">Figure 8</xref>), where commonly used drug names in clinical practice were interpreted as the scientific names of mosquitoes and, when questioned further, ChatGPT refused to acknowledge the error (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). We attribute the causes of these AI delusions to a lack of background knowledge and insufficient prompts.</p>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>The 3D scatter plot of the dimensions, showing a few instances of extremely low responses by ChatGPT on the left side of the plot and dense distribution of ChatGPT responses on the high completeness dimension.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e62857_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>In the realm of medicine, a discipline that relentlessly pursues zero errors as a necessity of natural science and ethics, allowing AI to engage in self-expression is inappropriate. Therefore, we also agree that it is imperative for professionals to verify the output of ChatGPT [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>], despite our observations indicating that it often performs at a level comparable to that of experts.</p>
      </sec>
      <sec>
        <title>Evaluating the Achievements of AI Should First Be Based on How Humans Assess Their Own Accomplishments</title>
        <p>Although ChatGPT may provide outdated or incorrect information, the level at which an LLM operates is a key consideration. Care should be taken when comparing ChatGPT with various experts or professional guidelines. Additionally, we must consider whether our human experts are capable of effectively dissecting and conveying complex, obscure, and uncommon terms and concepts to laypersons [<xref ref-type="bibr" rid="ref39">39</xref>]. Criticisms and warnings about LLMs are prevalent, reminding us of the need to contemplate the baseline definition of medical practice. Questions arise as to whether outputs need to strictly adhere to guidelines and if the discrepancies in guidelines among different countries, regions, and medical associations have been fully addressed. If not, evaluating LLMs or AI outputs will always involve subjective differences.</p>
        <p>Based on our findings, we cautiously endorse the view that ChatGPT has the potential to improve patients’ access to disease information in health care settings [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Its performance may be even better when assessed by nonspecialist doctors or young medical students. If we were to compare humans to AI in the context of online community doctors, we speculate that the positive outcomes would be significantly pronounced [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      </sec>
      <sec>
        <title>Next Steps in Exploration</title>
        <p>To our knowledge, this study represents the first invitation for IBD health information consumers and providers to participate in a crowdsourced evaluation. It is also an exploration of the readability of simplified Chinese characters in the context of IBD.</p>
        <p>Introducing tools like ChatGPT into patient communities and basic patient education settings in a timely manner seems feasible: Initiating the use of ChatGPT to draft medical information for health care providers (health self-media practitioners, health care professionals, medical institution promoters), followed by expert review and refinement, appears to be a viable and convenient production pathway. Undoubtedly, the quality of ChatGPT’s responses will gradually improve with version updates and over time, making the tool even more promising [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <p>Although not the primary hypothesis of our experiment, we also observed variations in text quality between different disease types generated by ChatGPT [<xref ref-type="bibr" rid="ref37">37</xref>]. Furthermore, ChatGPT has an overwhelming advantage over human experts in terms of speed of content creation. Many participating doctors acknowledge that crafting understandable content for patients in health education efforts requires significant dedication and effort [<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        <p>Previously, on social media platforms and in online medical consultation scenarios, ChatGPT’s response capabilities have surpassed those of ordinary doctors in addressing common disease symptoms [<xref ref-type="bibr" rid="ref21">21</xref>]. However, in this study’s specialized vertical field (specifically referring to IBD specialization), professional doctors still demonstrate superior judgment and threshold control in information decision-making. We can speculate that LLMs have critical threshold points in disseminating information in specialized vertical fields. It is essential for us to identify these thresholds rationally: disseminating information to laypersons below the threshold and utilizing tools to assist professionals above the threshold.</p>
        <p>We envision a brighter future in health care, advocating for outstanding organizations (such as national cancer research centers or high-quality industry databases) to promote the dissemination of untainted high-quality data through independent reviews and exploration and subsequently leveraging digital tools like LLMs to share these data freely or affordably with patients, their families, and young doctors in need of accessing such information [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref39">39</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <sec>
          <title>Tool and Method Selection</title>
          <p>In order to achieve a sufficient sample size for significant effects, we temporarily set aside the assessment of evaluator consistency and well-validated information tools such as Patient Education Materials Assessment Tool and DISCERN (not disregarding them) [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. Compared with subjective crowdsourced rating strategies, these questionnaires or systems have relatively higher thresholds and specific use cases. Some researchers have suggested that certain health information assessment tools may not be universally suitable [<xref ref-type="bibr" rid="ref22">22</xref>]. If resources permit and the context is appropriate, we also recommend considering the simultaneous use of the aforementioned tools in the future and, when necessary, conducting accuracy assessments based on medical guidelines for evidence-based evaluation [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        </sec>
        <sec>
          <title>Reply Randomness and Answer Reproducibility</title>
          <p>Many researchers argue that a key limitation of the application and reproducibility of large-scale language models lies in the inherent randomness of their generated responses [<xref ref-type="bibr" rid="ref6">6</xref>]. This inherent randomness refers to the unpredictability of these models, primarily because they are trained on various text data and use probabilistic algorithms to generate answers. Even with multiple inputs of the same or similar content, this inherent randomness can lead to variations in the quality and accuracy of the outputs [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. However, some experiments suggest that repeating questions to ChatGPT multiple times results in excellent consistency of answers, reaching 90.48% to 100% [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Our preliminary findings also indicate that, if the prompts are the same, although not identical in every aspect, the structure and substantive content of the responses from ChatGPT are generally similar (<xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). Despite the aforementioned good reproducibility of ChatGPT, we have not yet fully overcome this limitation in our experiment.</p>
        </sec>
        <sec>
          <title>Model Version Changes</title>
          <p>The use of LLMs in patient education represents an interdisciplinary field at the intersection of medicine and technology. Large-scale AI language models possess the capability for improvement and learning, rendering similar research findings potentially outdated in a short span of time [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. Just as we completed the compilation of responses in the second week, OpenAI released a new version. This is why we adhere to an open science approach, using publicly available and traceable materials as the textual sources for this comparison. Given improved conditions, we suggest that peers could build upon this foundation to conduct more comprehensive experiments or expand them into randomized controlled trials.</p>
        </sec>
        <sec>
          <title>Network Latency and Restrictions</title>
          <p>The blocking of ChatGPT in specific regions’ IP addresses (such as mainland China and Hong Kong) has added additional challenges to the use of this technology. High latency and instances of crashes have made the entire response process lengthy. Although these limitations indeed exist, they were not reflected in our results. Exceptional technology not only guides outstanding experimental outcomes but also relies on the accessibility and low barriers to entry of that technology. It is hoped that, in the future, all individuals, especially those in underdeveloped regions, can benefit from this technology. Gratitude is extended to OpenAI and ChatGPT 3.5 for their free and open-source demonstration of the allure of LLMs and the exploration of their application scenarios.</p>
          <p>As of the date of the revised manuscript, this limitation has been alleviated, with numerous outstanding general and specialized LLMs emerging in both China and the United States (eg, Baichuan, Qwen, LLaMA, Claude). Meanwhile, the use of ChatGPT-like alternative products for medical consultations and learning in broader health-related scenarios has gradually begun to be integrated into daily life.</p>
        </sec>
        <sec>
          <title>Current Limitations in Use Scenarios</title>
          <p>Countries worldwide have enacted citizen health information privacy protection measures [<xref ref-type="bibr" rid="ref35">35</xref>], such as China’s Personal Information Protection Law and the United States Health Insurance Portability and Accountability Act. Under current circumstances, we cannot and do not recommend researchers directly extract patient questions from patient communities, communication social media platforms (such as WeChat, WhatsApp), or outpatient settings to pose queries to ChatGPT. This is why, when considering the adoption of patient question sources, we collect authorized publications with management oversight.</p>
        </sec>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In all dimensions, regardless of subjective or objective evaluation, ChatGPT demonstrated greater stability than human experts. When it came to responses to specialized medical questions, ChatGPT’s overall performance was on par with that of human specialist doctors. Its output of health information exhibited a better structural coherence, addressing the differentiation in outputs caused by cognitive and knowledge variations among individual specialist doctors. Using ChatGPT-3.5 to draft patient education materials, with doctors refining, supplementing, and proofreading the information, is acceptable and worth promoting. However, direct patient consultations and health education using ChatGPT are not feasible due to the presence of AI hallucinations. Differences in empathy and accuracy may exist between health care providers and patients. As primary consumers of health information, patients need to be involved in the creation and evaluation of health information. Before extensively applying LLMs in medical practice, more clinical trials and case studies are needed to assess their effectiveness and potential side effects. Ethical and privacy concerns, user training and education, and ongoing monitoring and evaluation are all issues that we need to consider and carefully deliberate.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Bilingual table of contents for Q&#38;A on Ulcerative Colitis and Crohn's Diseas</p>
        <media xlink:href="jmir_v27i1e62857_app1.docx" xlink:title="DOCX File , 35 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Co-authored original responses by doctors and patients.</p>
        <media xlink:href="jmir_v27i1e62857_app2.docx" xlink:title="DOCX File , 53 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Selected evaluation cases of responses.</p>
        <media xlink:href="jmir_v27i1e62857_app3.docx" xlink:title="DOCX File , 29 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Examples of AI hallucinations.</p>
        <media xlink:href="jmir_v27i1e62857_app4.docx" xlink:title="DOCX File , 21 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Examples of reproducibility responses.</p>
        <media xlink:href="jmir_v27i1e62857_app5.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CCCF</term>
          <def>
            <p>China Crohn’s and Colitis Foundation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CRIE</term>
          <def>
            <p>Chinese Readability Index Explorer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">IBD</term>
          <def>
            <p>inflammatory bowel disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We extend our sincere gratitude for the authorization provided by China Crohn’s and Colitis Foundation (CCCF) and Zhejiang University Press. We deeply appreciate the generous support from the Chinese Readability Index Explorer 3.0 team and the invaluable assistance of Tseng.</p>
      <p>Our heartfelt thanks go to the CCCF patient community and the 3 inflammatory bowel disease patient volunteers (HYC, XXQ, JMC) for their selfless dedication in participating in the assessment.</p>
      <p>The translation and editing of this article were facilitated by the translation and refinement features of ChatGPT.</p>
      <p>We thank openbiox community and Hiplot team [<xref ref-type="bibr" rid="ref44">44</xref>] for providing technical assistance and valuable tools for data analysis and visualization.</p>
      <p>This research was supported by the Qingfeng Scientific Research Fund of the CCCF under grant number CCCF-QF-2022A60-1.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>ZY had full access to all the data in the study and takes responsibility for the integrity of the data and the accuracy of the data analysis. ZY, YC, and YF conceived and designed the study. ZY, YY, DX, HW, and YC collected the data and assembled the facts. JM, HCT, THC, and YY transformed the data and provided technical support. ZY and YC drafted the manuscript. SL, YC, and YF critically revised the manuscript for important intellectual content. ZY and JL performed the statistical analysis. YC acquired funding. YC and YF provided administrative, technical, or material support. YC supervised the study.</p>
      </fn>
      <fn fn-type="conflict">
        <p>ZY previously acted as an Operations Coordinator at China Crohn’s and Colitis Foundation (CCCF), executing the public awareness campaign on inflammatory bowel disease (IBD) and playing a key role in organizing the knowledge base content for IBD patients.
      YC was the Chairman of CCCF.
      YC and YF contributed to the authoring of “Q&#38;A on Ulcerative Colitis and Crohn's Disease.”</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Musheyev</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bockelman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Loeb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kabarriti</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Assessment of artificial intelligence chatbot responses to top searched queries about cancer</article-title>
          <source>JAMA Oncol</source>
          <year>2023</year>
          <month>10</month>
          <day>01</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>1437</fpage>
          <lpage>1440</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaoncol.2023.2947</pub-id>
          <pub-id pub-id-type="medline">37615960</pub-id>
          <pub-id pub-id-type="pii">2808733</pub-id>
          <pub-id pub-id-type="pmcid">PMC10450581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ying</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT's potential role in non-English-speaking outpatient clinic settings</article-title>
          <source>Digit Health</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>20552076231184091</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/20552076231184091?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20552076231184091</pub-id>
          <pub-id pub-id-type="medline">37434733</pub-id>
          <pub-id pub-id-type="pii">10.1177_20552076231184091</pub-id>
          <pub-id pub-id-type="pmcid">PMC10331772</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Dou</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Performance and exploration of ChatGPT in medical examination, records and education in Chinese: Pave the way for medical AI</article-title>
          <source>Int J Med Inform</source>
          <year>2023</year>
          <month>09</month>
          <volume>177</volume>
          <fpage>105173</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105173</pub-id>
          <pub-id pub-id-type="medline">37549499</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(23)00191-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kung</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Cheatham</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Medenilla</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sillos</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>De Leon</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Elepaño</surname>
              <given-names>Camille</given-names>
            </name>
            <name name-style="western">
              <surname>Madriaga</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aggabao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Diaz-Candido</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Maningo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on USMLE: potential for AI-assisted medical education using large language models</article-title>
          <source>PLOS Digit Health</source>
          <year>2023</year>
          <month>02</month>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e0000198</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36812645"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pdig.0000198</pub-id>
          <pub-id pub-id-type="medline">36812645</pub-id>
          <pub-id pub-id-type="pii">PDIG-D-22-00371</pub-id>
          <pub-id pub-id-type="pmcid">PMC9931230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gorelik</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ghersin</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Maza</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Harnessing language models for streamlined postcolonoscopy patient management: a novel approach</article-title>
          <source>Gastrointest Endosc</source>
          <year>2023</year>
          <month>10</month>
          <volume>98</volume>
          <issue>4</issue>
          <fpage>639</fpage>
          <lpage>641.e4</lpage>
          <pub-id pub-id-type="doi">10.1016/j.gie.2023.06.025</pub-id>
          <pub-id pub-id-type="medline">37385548</pub-id>
          <pub-id pub-id-type="pii">S0016-5107(23)02675-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jeblick</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Schachtner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dexl</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mittermeier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stüber</surname>
              <given-names>Anna Theresa</given-names>
            </name>
            <name name-style="western">
              <surname>Topalis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wesp</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sabel</surname>
              <given-names>BO</given-names>
            </name>
            <name name-style="western">
              <surname>Ricke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ingrisch</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT makes medicine easy to swallow: an exploratory case study on simplified radiology reports</article-title>
          <source>Eur Radiol</source>
          <year>2024</year>
          <month>05</month>
          <volume>34</volume>
          <issue>5</issue>
          <fpage>2817</fpage>
          <lpage>2825</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37794249"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00330-023-10213-1</pub-id>
          <pub-id pub-id-type="medline">37794249</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00330-023-10213-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC11126432</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henson</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Glissen Brown</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Leiman</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of the potential utility of an artificial intelligence chatbot in gastroesophageal reflux disease management</article-title>
          <source>Am J Gastroenterol</source>
          <year>2023</year>
          <month>12</month>
          <day>01</day>
          <volume>118</volume>
          <issue>12</issue>
          <fpage>2276</fpage>
          <lpage>2279</lpage>
          <pub-id pub-id-type="doi">10.14309/ajg.0000000000002397</pub-id>
          <pub-id pub-id-type="medline">37410934</pub-id>
          <pub-id pub-id-type="pii">00000434-202312000-00031</pub-id>
          <pub-id pub-id-type="pmcid">PMC10834834</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>ZR</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Simard</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Linos</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Assessing biases in medical decisions via clinician and AI chatbot responses to patient vignettes</article-title>
          <source>JAMA Netw Open</source>
          <year>2023</year>
          <month>10</month>
          <day>02</day>
          <volume>6</volume>
          <issue>10</issue>
          <fpage>e2338050</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37847506"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.38050</pub-id>
          <pub-id pub-id-type="medline">37847506</pub-id>
          <pub-id pub-id-type="pii">2810775</pub-id>
          <pub-id pub-id-type="pmcid">PMC10582782</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Ghani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kuemmerli</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nebiker</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>Beat Peter</given-names>
            </name>
            <name name-style="western">
              <surname>Raptis</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Staubli</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Reliability of medical information provided by ChatGPT: assessment against clinical guidelines and patient information quality instrument</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>06</month>
          <day>30</day>
          <volume>25</volume>
          <fpage>e47479</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e47479/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/47479</pub-id>
          <pub-id pub-id-type="medline">37389908</pub-id>
          <pub-id pub-id-type="pii">v25i1e47479</pub-id>
          <pub-id pub-id-type="pmcid">PMC10365578</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bubeck</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Petro</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Benefits, limits, and risks of GPT-4 as an AI chatbot for medicine</article-title>
          <source>N Engl J Med</source>
          <year>2023</year>
          <month>03</month>
          <day>30</day>
          <volume>388</volume>
          <issue>13</issue>
          <fpage>1233</fpage>
          <lpage>1239</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMsr2214184</pub-id>
          <pub-id pub-id-type="medline">36988602</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madrigal</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Escoffery</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Electronic health behaviors among US adults with chronic disease: cross-sectional survey</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>03</month>
          <day>05</day>
          <volume>21</volume>
          <issue>3</issue>
          <fpage>e11240</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/3/e11240/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11240</pub-id>
          <pub-id pub-id-type="medline">30835242</pub-id>
          <pub-id pub-id-type="pii">v21i3e11240</pub-id>
          <pub-id pub-id-type="pmcid">PMC6423466</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Health information on social media helps mitigate Crohn's disease symptoms and improves patients' clinical course</article-title>
          <source>Computers in Human Behavior</source>
          <year>2021</year>
          <month>02</month>
          <volume>115</volume>
          <fpage>106588</fpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2020.106588</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fortinsky</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fournier</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Benchimol</surname>
              <given-names>EI</given-names>
            </name>
          </person-group>
          <article-title>Internet and electronic resources for inflammatory bowel disease: a primer for providers and patients</article-title>
          <source>Inflamm Bowel Dis</source>
          <year>2012</year>
          <month>06</month>
          <volume>18</volume>
          <issue>6</issue>
          <fpage>1156</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="doi">10.1002/ibd.22834</pub-id>
          <pub-id pub-id-type="medline">22147497</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>XY</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>YW</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Online information on Crohn's disease in Chinese: an evaluation of its quality and readability</article-title>
          <source>J Dig Dis</source>
          <year>2019</year>
          <month>11</month>
          <volume>20</volume>
          <issue>11</issue>
          <fpage>596</fpage>
          <lpage>601</lpage>
          <pub-id pub-id-type="doi">10.1111/1751-2980.12822</pub-id>
          <pub-id pub-id-type="medline">31583816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bernard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Langille</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rose</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Leddin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Veldhuyzen van Zanten</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of patient inflammatory bowel disease information resources on the World Wide Web</article-title>
          <source>Am J Gastroenterol</source>
          <year>2007</year>
          <month>09</month>
          <volume>102</volume>
          <issue>9</issue>
          <fpage>2070</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1572-0241.2007.01325.x</pub-id>
          <pub-id pub-id-type="medline">17511753</pub-id>
          <pub-id pub-id-type="pii">AJG1325</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Langille</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bernard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rodgers</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Leddin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>van Zanten</surname>
              <given-names>SV</given-names>
            </name>
          </person-group>
          <article-title>Systematic review of the quality of patient information on the internet regarding inflammatory bowel disease treatments</article-title>
          <source>Clin Gastroenterol Hepatol</source>
          <year>2010</year>
          <month>04</month>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>322</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cgh.2009.12.024</pub-id>
          <pub-id pub-id-type="medline">20060070</pub-id>
          <pub-id pub-id-type="pii">S1542-3565(09)01333-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mukewar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mani</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>YouTube and inflammatory bowel disease</article-title>
          <source>J Crohns Colitis</source>
          <year>2013</year>
          <month>06</month>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>392</fpage>
          <lpage>402</lpage>
          <pub-id pub-id-type="doi">10.1016/j.crohns.2012.07.011</pub-id>
          <pub-id pub-id-type="medline">22906403</pub-id>
          <pub-id pub-id-type="pii">S1873-9946(12)00322-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>The reliability and quality of short videos as a source of dietary guidance for inflammatory bowel disease: cross-sectional study</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>02</month>
          <day>09</day>
          <volume>25</volume>
          <fpage>e41518</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e41518/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/41518</pub-id>
          <pub-id pub-id-type="medline">36757757</pub-id>
          <pub-id pub-id-type="pii">v25i1e41518</pub-id>
          <pub-id pub-id-type="pmcid">PMC9951074</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Internet and WeChat used by patients with Crohn's disease in China: a multi-center questionnaire survey</article-title>
          <source>BMC Gastroenterol</source>
          <year>2019</year>
          <month>06</month>
          <day>20</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>97</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcgastroenterol.biomedcentral.com/articles/10.1186/s12876-019-1011-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12876-019-1011-3</pub-id>
          <pub-id pub-id-type="medline">31221086</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12876-019-1011-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC6584988</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <source>The China Crohn's and Colitis Foundation</source>
          <year>2017</year>
          <month>06</month>
          <day>2</day>
          <access-date>2023-10-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mp.weixin.qq.com/s/L72X3B7vAHZba1O8ABYUnQ">https://mp.weixin.qq.com/s/L72X3B7vAHZba1O8ABYUnQ</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Poliak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Faix</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Longhurst</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Hogarth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Comparing physician and artificial intelligence chatbot responses to patient questions posted to a public social media forum</article-title>
          <source>JAMA Intern Med</source>
          <year>2023</year>
          <month>06</month>
          <day>01</day>
          <volume>183</volume>
          <issue>6</issue>
          <fpage>589</fpage>
          <lpage>596</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37115527"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2023.1838</pub-id>
          <pub-id pub-id-type="medline">37115527</pub-id>
          <pub-id pub-id-type="pii">2804309</pub-id>
          <pub-id pub-id-type="pmcid">PMC10148230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yun</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>EK</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive evaluation of ChatGPT consultation quality for augmentation mammoplasty: a comparative analysis between plastic surgeons and laypersons</article-title>
          <source>Int J Med Inform</source>
          <year>2023</year>
          <month>11</month>
          <volume>179</volume>
          <fpage>105219</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1386-5056(23)00237-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105219</pub-id>
          <pub-id pub-id-type="medline">37776670</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(23)00237-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yeo</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Samaan</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Trivedi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Vipani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ayoub</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Liran</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Spiegel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Assessing the performance of ChatGPT in answering questions regarding cirrhosis and hepatocellular carcinoma</article-title>
          <source>Clin Mol Hepatol</source>
          <year>2023</year>
          <month>07</month>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>721</fpage>
          <lpage>732</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36946005"/>
          </comment>
          <pub-id pub-id-type="doi">10.3350/cmh.2023.0089</pub-id>
          <pub-id pub-id-type="medline">36946005</pub-id>
          <pub-id pub-id-type="pii">cmh.2023.0089</pub-id>
          <pub-id pub-id-type="pmcid">PMC10366809</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <source>ChatGPT</source>
          <access-date>2025-02-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://chat.openai.com/share/4be965cf-a024-4f8e-a438-a9064a1e0657">https://chat.openai.com/share/4be965cf-a024-4f8e-a438-a9064a1e0657</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van der Marel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Duijvestein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hardwick</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>van den Brink</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Veenendaal</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hommes</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Fidder</surname>
              <given-names>HH</given-names>
            </name>
          </person-group>
          <article-title>Quality of web-based information on inflammatory bowel diseases</article-title>
          <source>Inflamm Bowel Dis</source>
          <year>2009</year>
          <month>12</month>
          <volume>15</volume>
          <issue>12</issue>
          <fpage>1891</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1002/ibd.20976</pub-id>
          <pub-id pub-id-type="medline">19462423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <source>Chinese Readability Index Explorer</source>
          <access-date>2025-02-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.chinesereadability.net/CRIE.">http://www.chinesereadability.net/CRIE</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sung</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Hsieh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>CRIE: an automated analyzer for Chinese texts</article-title>
          <source>Behav Res Methods</source>
          <year>2016</year>
          <month>12</month>
          <volume>48</volume>
          <issue>4</issue>
          <fpage>1238</fpage>
          <lpage>1251</lpage>
          <pub-id pub-id-type="doi">10.3758/s13428-015-0649-1</pub-id>
          <pub-id pub-id-type="medline">26424442</pub-id>
          <pub-id pub-id-type="pii">10.3758/s13428-015-0649-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sung</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Constructing and validating readability models: the method of integrating multilevel linguistic features with machine learning</article-title>
          <source>Behav Res Methods</source>
          <year>2015</year>
          <month>06</month>
          <volume>47</volume>
          <issue>2</issue>
          <fpage>340</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.3758/s13428-014-0459-x</pub-id>
          <pub-id pub-id-type="medline">24687843</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sung</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Dyson</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Leveling L2 texts through readability: combining multilevel linguistic features with the CEFR</article-title>
          <source>The Modern Language Journal</source>
          <year>2015</year>
          <month>07</month>
          <day>28</day>
          <volume>99</volume>
          <issue>2</issue>
          <fpage>371</fpage>
          <lpage>391</lpage>
          <pub-id pub-id-type="doi">10.1111/modl.12213</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sung</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Integrating LSA-based hierarchical conceptual space and machine learning methods for leveling the readability of domain-specific texts</article-title>
          <source>Nat. Lang. Eng</source>
          <year>2019</year>
          <month>04</month>
          <day>05</day>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>331</fpage>
          <lpage>361</lpage>
          <pub-id pub-id-type="doi">10.1017/s1351324919000093</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of the quality and readability of online information about breast cancer in China</article-title>
          <source>Patient Educ Couns</source>
          <year>2021</year>
          <month>04</month>
          <volume>104</volume>
          <issue>4</issue>
          <fpage>858</fpage>
          <lpage>864</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0738-3991(20)30510-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2020.09.012</pub-id>
          <pub-id pub-id-type="medline">32988687</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(20)30510-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of quality and readability of over-the-counter medication package inserts</article-title>
          <source>Res Social Adm Pharm</source>
          <year>2022</year>
          <month>09</month>
          <volume>18</volume>
          <issue>9</issue>
          <fpage>3560</fpage>
          <lpage>3567</lpage>
          <pub-id pub-id-type="doi">10.1016/j.sapharm.2022.03.012</pub-id>
          <pub-id pub-id-type="medline">35379561</pub-id>
          <pub-id pub-id-type="pii">S1551-7411(22)00088-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Azizi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mahdavi</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Scales</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tanwani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cole-Lewis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pfohl</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Payne</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Seneviratne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gamble</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kelly</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Babiker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schärli</surname>
              <given-names>Nathanael</given-names>
            </name>
            <name name-style="western">
              <surname>Chowdhery</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mansfield</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Demner-Fushman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Agüera Y Arcas</surname>
              <given-names>Blaise</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Matias</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gottweis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tomasev</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barral</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Semturs</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Karthikesalingam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Large language models encode clinical knowledge</article-title>
          <source>Nature</source>
          <year>2023</year>
          <month>08</month>
          <volume>620</volume>
          <issue>7972</issue>
          <fpage>172</fpage>
          <lpage>180</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37438534"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41586-023-06291-2</pub-id>
          <pub-id pub-id-type="medline">37438534</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-023-06291-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10396962</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Lobo</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of internet decision-making resources for patients considering surgery for ulcerative colitis</article-title>
          <source>Inflamm Bowel Dis</source>
          <year>2017</year>
          <month>08</month>
          <volume>23</volume>
          <issue>8</issue>
          <fpage>1293</fpage>
          <lpage>1300</lpage>
          <pub-id pub-id-type="doi">10.1097/MIB.0000000000001198</pub-id>
          <pub-id pub-id-type="medline">28708807</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Xinhua News Agency</collab>
          </person-group>
          <article-title>Personal Information Protection Law of the People's Republic of China</article-title>
          <source>China Government Network</source>
          <year>2021</year>
          <month>08</month>
          <day>20</day>
          <access-date>2023-10-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.gov.cn/xinwen/2021-08/20/content_5632486.htm">https://www.gov.cn/xinwen/2021-08/20/content_5632486.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coulter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Entwistle</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Sharing decisions with patients: is the information good enough?</article-title>
          <source>BMJ</source>
          <year>1999</year>
          <month>01</month>
          <day>30</day>
          <volume>318</volume>
          <issue>7179</issue>
          <fpage>318</fpage>
          <lpage>22</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/9924064"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.318.7179.318</pub-id>
          <pub-id pub-id-type="medline">9924064</pub-id>
          <pub-id pub-id-type="pmcid">PMC1114785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Dobbs</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Hutchings</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Whitaker</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Using ChatGPT to write patient clinic letters</article-title>
          <source>Lancet Digit Health</source>
          <year>2023</year>
          <month>04</month>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>e179</fpage>
          <lpage>e181</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-7500(23)00048-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2589-7500(23)00048-1</pub-id>
          <pub-id pub-id-type="medline">36894409</pub-id>
          <pub-id pub-id-type="pii">S2589-7500(23)00048-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Wanderer</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Turer</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>McCoy</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Sittig</surname>
              <given-names>DF</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Using AI-generated suggestions from ChatGPT to optimize clinical decision support</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2023</year>
          <month>06</month>
          <day>20</day>
          <volume>30</volume>
          <issue>7</issue>
          <fpage>1237</fpage>
          <lpage>1245</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37087108"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocad072</pub-id>
          <pub-id pub-id-type="medline">37087108</pub-id>
          <pub-id pub-id-type="pii">7136722</pub-id>
          <pub-id pub-id-type="pmcid">PMC10280357</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-from starting pilots to scalable privilege</article-title>
          <source>JAMA Oncol</source>
          <year>2023</year>
          <month>10</month>
          <day>01</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>1341</fpage>
          <lpage>1342</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaoncol.2023.2867</pub-id>
          <pub-id pub-id-type="medline">37615950</pub-id>
          <pub-id pub-id-type="pii">2808732</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Patrinely</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zimmerman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Donald</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berkowitz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Finn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jahangir</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Scoville</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Reese</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bastarache</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van der Heijden</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Carter</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Choe</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chastain</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zic</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Horst</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Turker</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Osmundson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Idrees</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kieman</surname>
              <given-names>Colleen</given-names>
            </name>
            <name name-style="western">
              <surname>Padmanabhan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schlegel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chambless</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Osterman</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wheless</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Assessing the accuracy and reliability of AI-generated medical responses: an evaluation of the Chat-GPT model</article-title>
          <source>Res Sq</source>
          <year>2023</year>
          <month>02</month>
          <day>28</day>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36909565"/>
          </comment>
          <pub-id pub-id-type="doi">10.21203/rs.3.rs-2566942/v1</pub-id>
          <pub-id pub-id-type="medline">36909565</pub-id>
          <pub-id pub-id-type="pii">rs.3.rs-2566942</pub-id>
          <pub-id pub-id-type="pmcid">PMC10002821</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayre</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mac</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>McCaffery</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>McKay</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rezwan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>AG</given-names>
            </name>
          </person-group>
          <article-title>New frontiers in health literacy: using ChatGPT to simplify health information for people in the community</article-title>
          <source>J Gen Intern Med</source>
          <year>2024</year>
          <month>03</month>
          <volume>39</volume>
          <issue>4</issue>
          <fpage>573</fpage>
          <lpage>577</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37940756"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-023-08469-w</pub-id>
          <pub-id pub-id-type="medline">37940756</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11606-023-08469-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC10973278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Charnock</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shepperd</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Needham</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gann</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>DISCERN: an instrument for judging the quality of written consumer health information on treatment choices</article-title>
          <source>J Epidemiol Community Health</source>
          <year>1999</year>
          <month>02</month>
          <day>01</day>
          <volume>53</volume>
          <issue>2</issue>
          <fpage>105</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jech.bmj.com/lookup/pmidlookup?view=long&#38;pmid=10396471"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jech.53.2.105</pub-id>
          <pub-id pub-id-type="medline">10396471</pub-id>
          <pub-id pub-id-type="pmcid">PMC1756830</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shoemaker</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Brach</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Development of the Patient Education Materials Assessment Tool (PEMAT): a new measure of understandability and actionability for print and audiovisual patient information</article-title>
          <source>Patient Educ Couns</source>
          <year>2014</year>
          <month>09</month>
          <volume>96</volume>
          <issue>3</issue>
          <fpage>395</fpage>
          <lpage>403</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24973195"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2014.05.027</pub-id>
          <pub-id pub-id-type="medline">24973195</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(14)00233-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC5085258</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <source>Hiplot</source>
          <access-date>2025-02-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://hiplot.org">https://hiplot.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
