<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v28i1e83051</article-id>
      <article-id pub-id-type="pmid">41707180</article-id>
      <article-id pub-id-type="doi">10.2196/83051</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Developing a Service Quality Index System for AI Health Care Chatbots: Mixed Methods Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Stone</surname>
            <given-names>Alicia</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Al-Tehewy</surname>
            <given-names>Mahi Mahmoud</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Malas</surname>
            <given-names>Kathy</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Gu</surname>
            <given-names>Yu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Medical Technology</institution>
            <institution>Capital Medical University</institution>
            <addr-line>No 10 Xi Toutiao Road</addr-line>
            <addr-line>Beijing, 100069</addr-line>
            <country>China</country>
            <phone>86 81476234</phone>
            <email>bitguyu@126.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9917-4809</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Xinyi</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-1533-5827</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Medical Technology</institution>
        <institution>Capital Medical University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yu Gu <email>bitguyu@126.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>18</day>
        <month>2</month>
        <year>2026</year>
      </pub-date>
      <volume>28</volume>
      <elocation-id>e83051</elocation-id>
      <history>
        <date date-type="received">
          <day>28</day>
          <month>8</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>24</day>
          <month>10</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>30</day>
          <month>12</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Yu Gu, Xinyi Wang. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 18.02.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2026/1/e83051" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Artificial intelligence (AI) health care chatbots are gaining widespread adoption worldwide. It is imperative to understand the service quality of AI health care chatbots. However, there is limited guidance on how to comprehensively evaluate their service quality.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to develop an index system based on the SERVQUAL framework for evaluating the service quality of AI health care chatbots.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>An initial indicator pool was compiled through a comprehensive literature review and consultations with 4 experts. These indicators were mapped and categorized into 5 domains adapted from the SERVQUAL framework. The experts were recruited from hospital, university, and health commission settings by purposive sampling. The service quality index system was identified using a 2-round Delphi process, which included a virtual meeting between the 2 rounds. In the third round, indicator weights within each quality domain and subdomain were determined using the analytic hierarchy process.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>There were 26 indicators identified in the literature, based on which the 2-round Delphi process was conducted. A total of 20 experts were invited. The response rates in both rounds of Delphi and the analytic hierarchy process were 100%, and the authority coefficients were both &#62;0.7. The final service quality index system for AI health care chatbots comprises 5 primary indicators and 17 secondary indicators. There were 3 (18%) indicators on assurance, 4 (24%) on reliability, 3 (18%) on human-likeness, 4 (24%) on tangibility, and 3 (18%) on responsiveness. The primary indicators, ranked from highest to lowest weight, were assurance (0.239), reliability (0.237), human-likeness (0.187), tangibility (0.170), and responsiveness (0.167).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study pioneers the development of a service quality index system for AI health care chatbots adapted from the SERVQUAL framework. The results provide a validated tool for evaluating the performance of chatbots and offer valuable insights for health service managers and developers to enhance AI-driven medical consultation services.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>artificial intelligence health care chatbot</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
        <kwd>service quality</kwd>
        <kwd>Delphi method</kwd>
        <kwd>analytic hierarchy process</kwd>
        <kwd>index system development</kwd>
        <kwd>SERVQUAL</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Worldwide, artificial intelligence (AI) chatbots have been introduced into health care settings in recent years, where they are used by individuals as AI physicians for online medical consultations. A key innovation of AI health care chatbots lies in their ability to generate humanlike, natural language responses to diverse health-related queries anytime and anywhere, significantly improving access to medical guidance for broader populations [<xref ref-type="bibr" rid="ref1">1</xref>]. Unlike earlier rule-based chatbots that relied on scripted replies, AI chatbots leverage advanced technologies, such as large language models (LLMs), to deliver personalized and context-aware interactions [<xref ref-type="bibr" rid="ref2">2</xref>]. Moreover, the consultation service is often provided free of charge. AI health care chatbots show promise in delivering reliable medical advice without direct involvement from human physicians, offering a scalable solution to persistent challenges within the global health system, such as limited resources, uneven distribution, high costs, and growing demand [<xref ref-type="bibr" rid="ref3">3</xref>]. Therefore, AI health care chatbots are playing an increasingly important role in modern health care systems [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>AI health care chatbots represent not only a new type of service provider but also an innovative medical service model [<xref ref-type="bibr" rid="ref5">5</xref>]. As an emerging field, chatbots have attracted growing attention from both practitioners and researchers. Despite their potential benefits, concerns remain regarding their service quality [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Efforts have been made to develop quality indicators for AI health care chatbots [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. Some studies have evaluated response quality within specific disease contexts, such as labor epidurals, cardiovascular health, oncology, psoriasis, chronic hepatitis, and cancer [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Others have focused on assessing information quality [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>] or have compared the performance of AI health care chatbots with that of human physicians [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. However, existing studies primarily focus on narrow aspects of quality. Furthermore, the most commonly applied metrics—response accuracy, completeness, and consistency in closed-ended clinical questions—are predominantly defined from the health care providers’ perspective rather than that of users. Therefore, a comprehensive and user-centered index system for evaluating service quality of AI health care chatbots remains underdeveloped.</p>
      <p>Among existing service quality frameworks, SERVQUAL, developed by Parasuraman et al [<xref ref-type="bibr" rid="ref17">17</xref>], is one of the most widely recognized frameworks for evaluating medical service quality worldwide. This framework includes 5 dimensions—tangibility, reliability, responsiveness, assurance, and empathy—and is specifically designed to assess users’ expectations and perceptions of service quality [<xref ref-type="bibr" rid="ref18">18</xref>]. Applying this classical framework enables a more comprehensive and theoretically grounded evaluation of service quality of AI health care chatbots, bridging classical service quality theory with emerging AI-driven health care contexts.</p>
      <p>The aim of this study was to identify critical indicators that reflect the service quality of AI health care chatbots and to develop a scientifically feasible index system for its evaluation. The findings were expected to contribute to better identification of shortcomings, promote continuous quality improvement, enhance user experience, and offer new insights into the systemic evaluation of service quality of AI health care chatbots.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design</title>
        <p>This study used a mixed methods approach, combining qualitative insights from expert opinions with quantitative metrics to develop and quantify a service quality index system for AI health care chatbots. The literature review and expert consultation were applied to construct an initial indicator pool. The 2-round Delphi consultation was then conducted to refine and establish the final index system. Subsequently, the analytic hierarchy process (AHP) was applied to determine the weight of each indicator. The process of index system development and weight determination is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The research process. AHP: analytic hierarchy process.</p>
          </caption>
          <graphic xlink:href="jmir_v28i1e83051_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Initial Indicator Pool</title>
        <p>The initial indicator pool was compiled based on existing literature and expert opinions. A comprehensive systematic literature search was conducted in 4 databases: PubMed, Web of Science, China National Knowledge Infrastructure, and Wanfang Data. The search strategy incorporated the following key terms: [“chatbot*” OR “chat-bot*” OR “conversational agent*” OR “conversational bot*” OR “conversational system*” OR “dialogue system*” OR ChatGPT] AND [“medic*” OR “health*” OR “disease*” OR “patient*”] AND [“quality indicator*” OR “quality evaluat*” OR “quality assess*” OR “quality measure*”]. Boolean operators (AND, OR, and NOT) were used to combine or refine search terms (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The exclusion criteria were as follows: (1) studies not focused on the evaluation of AI health care chatbots; (2) commentaries, protocols, letters, editorials, and conference abstracts; and (3) studies not published in English or Chinese.</p>
        <p>In the second phase, this study incorporated insights from 4 interdisciplinary experts specializing in intelligent health care and medical service management. These experts conducted in-depth discussions regarding the relevance, suitability, and validity of the preliminary indicators. None of them participated in the subsequent Delphi consultation rounds. Both prior literature and expert opinions emphasized that the SERVQUAL framework provides a user-centered foundation well suited for the evaluation of AI health care chatbots and highlighted anthropomorphism as a distinctive feature influencing perceived service quality in AI-driven interactions. Specifically, users desire AI health care chatbots to exhibit kindness through humanlike attributes, such as a name, image, and voice. Beyond a friendly appearance, users expect these systems to demonstrate social intelligence, including the ability to detect user emotions and respond with genuine concern, which goes beyond simple empathy. Furthermore, users expect personalized responses tailored to individual factors. Therefore, the <italic>human-likeness</italic> dimension was introduced as an innovative replacement for the traditional “empathy” construct to better capture the emotional and interactive capabilities unique to AI health care chatbots. Accordingly, this study established 5 first-level indicators adapted from the SERVQUAL structure: tangibility, responsiveness, assurance, human-likeness, and reliability, and 26 second-level indicators were included in the initial pool.</p>
      </sec>
      <sec>
        <title>Expert Selection</title>
        <p>The initial expert recruitment was conducted through recommendations from our collaborators in the field of intelligent health care. They were from renowned universities, tertiary hospitals, and provincial health sectors. To broaden the reach and ensure a diverse range of perspectives, the experts initially nominated by the researchers were then asked to suggest other qualified individuals who could contribute valuable insights to the study. The inclusion criteria for experts were as follows: (1) familiarity with research areas, such as intelligent health care, medical service management, health information management, and other related fields; (2) more than 5 years of professional experience in a relevant field; and (3) willingness to actively participate in the study and provide timely responses across multiple rounds of Delphi consultation. Finally, a total of 20 experts were recruited through purposive sampling.</p>
      </sec>
      <sec>
        <title>Delphi Process</title>
        <p>The Delphi method is a structured communication technique designed to systematically collect expert opinions and achieve consensus [<xref ref-type="bibr" rid="ref19">19</xref>]. It has been widely applied and validated as a robust research methodology in health care contexts [<xref ref-type="bibr" rid="ref20">20</xref>]. This study conducted a 2-round Delphi consultation to screen, refine, and finalize the indicators.</p>
        <p>The Delphi consultation questionnaire consisted of 2 main sections: an informed consent form and the main survey. The informed consent form outlined the study’s background, objectives, methodology, privacy protection measures, and contact information. The main survey collected information from five areas: (1) experts’ basic information, including age, education, and years of work experience; (2) the core consultation content, in which experts scored the importance and feasibility of each indicator using a 10-point scale (1=lowest and 10=highest); (3) the familiarity scale, rated by the experts themselves using a 5-point Likert scale (1=very unfamiliar and 5=very familiar); (4) the basis of expert judgment, evaluating the impact of theoretical analysis, practical experience, literature knowledge, and intuition on scoring (rated as high, medium, or low); and (5) blank fields, allowing experts to propose additions, deletions, or modifications to the indicators. All experts completed the informed consent process, and strict confidentiality was maintained throughout the entire process.</p>
        <p>The Delphi process was conducted between February 2025 and June 2025. In the first round, Delphi questionnaires in Microsoft Word format were distributed to 20 experts, with a 2-week response period. Experts were asked to rate both the primary and secondary indicators and to provide comments. On the basis of the results and comments from the first round, the questionnaire was revised and redistributed to the same 20 experts for the second round. The second round followed the same rating procedure as the first and achieved consensus among the experts.</p>
      </sec>
      <sec>
        <title>Indicator Selection</title>
        <p>To screen the indicators, this study used 3 important statistics: the mean importance score, the full-mark rate (proportion of experts assigning the highest score), and the coefficient of variation. The inclusion criteria were as follows: (1) a mean importance score ≥7.0, (2) a full-mark rate &#62;20%, and (3) a coefficient of variation &#60;0.25 [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. Any indicator failing to meet all 3 criteria was subject to deletion or revision based on panel discussion and qualitative feedback.</p>
      </sec>
      <sec>
        <title>AHP Procedure</title>
        <p>Following the 2-round Delphi consultation, the final set of indicators was confirmed. The same panel of experts was then invited to participate in a pairwise comparison process to determine indicator weights. For each pair of indicators within the same hierarchical level, judgment matrices were constructed using a 1 to 9 ordinal scale to assess their relative importance [<xref ref-type="bibr" rid="ref24">24</xref>]. The weight of each indicator was subsequently calculated using the percentage weighting method based on the pairwise comparison matrices, with higher weight values indicating greater perceived importance.</p>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <p>Statistical analysis was conducted using SPSS software (version 25.0; IBM Corp). The authority coefficient (Cr) represents the authority level of experts. Cr was the arithmetic mean of the experts’ judgment coefficient (Ca) and the experts’ familiarity coefficient (Cs) [<xref ref-type="bibr" rid="ref25">25</xref>]. A Cr value ≥0.7 was considered acceptable [<xref ref-type="bibr" rid="ref26">26</xref>]. The Ca value was derived from experts’ self-assessment of their own judgment criteria, as detailed in <xref ref-type="table" rid="table1">Table 1</xref>. The Cs value ranges from 1.0 (very familiar) to 0.2 (very unfamiliar). The coordination of expert opinions was tested using the Kendall coefficient of concordance (Kendall <italic>W</italic>), with a significance level of α=.05. YAAHP software (version 11.2; MetaDecision) was used to calculate the indicator weights and assess the consistency ratio. When the consistency ratio value was &#60;0.10, it was considered acceptable, indicating sufficient consistency in expert judgments [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>The judgment basis and degree of influence.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Judgment basis</td>
                <td colspan="3">Degree of impact on experts’ judgment</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High</td>
                <td>Medium</td>
                <td>Low</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Theoretical analysis</td>
                <td>0.3</td>
                <td>0.2</td>
                <td>0.1</td>
              </tr>
              <tr valign="top">
                <td>Practical experience</td>
                <td>0.5</td>
                <td>0.4</td>
                <td>0.3</td>
              </tr>
              <tr valign="top">
                <td>Reference literature</td>
                <td>0.1</td>
                <td>0.1</td>
                <td>0.1</td>
              </tr>
              <tr valign="top">
                <td>Expert intuition</td>
                <td>0.1</td>
                <td>0.1</td>
                <td>0.1</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>The study protocol was approved by the Ethics Committee of the Capital Medical University, Beijing, China (2025SY-071). Participants were informed of the study’s purpose and procedure. Online informed consent was obtained from each participant. All research data were stored on a password-encrypted computer, and only the researchers had access to the data. No compensation was provided to participants.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Characteristics of Experts</title>
        <p>A total of 20 experts completed the 2-round Delphi consultation and AHP evaluation. The panel consisted of 12 (60%) male and 8 (40%) female experts, ranging in age from 31 to 60 years. Among the experts, 17 (85%) held a master’s degree or higher. All experts possessed associate senior professional titles or higher. The panel included 10 (50%) experts from quality control departments of hospitals, 7 (35%) from universities, and 3 (15%) from national or regional health commissions. The detailed characteristics of these experts are summarized in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The characteristics of the Delphi consultation experts (N=20).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="670"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Characteristics</td>
                <td>Experts, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Sex</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>12 (60)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>8 (40)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Age (years)</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>31-40</td>
                <td>6 (30)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>41-50</td>
                <td>11 (55)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>51-60</td>
                <td>3 (15)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Education</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Doctoral degree</td>
                <td>10 (50)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Master’s degree</td>
                <td>7 (35)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bachelor’s degree</td>
                <td>3 (15)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Professional title</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Senior</td>
                <td>11 (55)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Associate senior</td>
                <td>9 (45)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Seniority (years)</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>6-10</td>
                <td>4 (20)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>11-20</td>
                <td>9 (45)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>21-30</td>
                <td>5 (25)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#62;30</td>
                <td>2 (10)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Affiliation</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hospitals</td>
                <td>10 (50)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Universities</td>
                <td>7 (35)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Health commission</td>
                <td>3 (15)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Field of expertise</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intelligent health care</td>
                <td>8 (40)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medical service management</td>
                <td>7 (35)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Health information management</td>
                <td>5 (25)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Authority Coefficient and Degree of Coordination</title>
        <p>The Cr values for the first and second rounds of the Delphi consultation were 0.894 (Ca=0.931; Cs=0.847) and 0.919 (Ca=0.917; Cs=0.921), respectively (<xref ref-type="table" rid="table3">Table 3</xref>). Both values exceed the accepted threshold of 0.7, indicating a high level of expert credibility and reinforcing the reliability of the consultation results.</p>
        <p>The Kendall <italic>W</italic> coefficients for the 2 consultation rounds are shown in <xref ref-type="table" rid="table3">Table 3</xref>. After the second round, the coordination coefficient of the indicators increased from 0.263 to 0.339, and all associated <italic>P</italic> values were &#60;.001, indicating that the experts’ opinions converged and that the degree of consensus among experts was acceptable.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Expert authority coefficients and the degree of coordination of expert opinions.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="130"/>
            <col width="140"/>
            <col width="140"/>
            <col width="160"/>
            <col width="140"/>
            <col width="140"/>
            <thead>
              <tr valign="bottom">
                <td>Round</td>
                <td>Ca<sup>a</sup></td>
                <td>Cs<sup>b</sup></td>
                <td>Cr<sup>c</sup></td>
                <td>Kendall <italic>W</italic></td>
                <td>Chi-square (<italic>df</italic>)</td>
                <td><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Round 1</td>
                <td>0.931</td>
                <td>0.847</td>
                <td>0.894</td>
                <td>0.263</td>
                <td>71.1 (25)</td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>Round 2</td>
                <td>0.917</td>
                <td>0.921</td>
                <td>0.919</td>
                <td>0.339</td>
                <td>123.2 (20)</td>
                <td>&#60;.001</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Ca: judgment coefficient.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Cs: familiarity coefficient.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Cr: authority coefficient.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Review for Initial Indicator Pool</title>
        <p>The database search and hand searches identified 117 articles, from which 48 (41.0%) duplicates were removed. After screening the titles and abstracts, 29 (24.8%) full-text records were reviewed, of which 20 (17.1%) were included in the review [<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref47">47</xref>]. The study selection process is illustrated in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Flowchart of the included studies.</p>
          </caption>
          <graphic xlink:href="jmir_v28i1e83051_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Of the 20 eligible studies, 9 (45%) focused exclusively on AI chatbots designed specifically for health care service [<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref36">36</xref>]. To develop a comprehensive initial indicator pool, we also included 11 additional studies concerning the quality of general AI chatbots capable of delivering health care–related consultations [<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref47">47</xref>]. Of all 20 included studies, 6 (30%) aimed to develop instruments for measuring the overall service quality of AI chatbots [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref40">40</xref>], with 2 (10%) grounded in the SERVQUAL model [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Another 7 (35%) studies developed instruments targeting specific dimensions of quality [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Additionally, 7 (35%) studies treated quality as a key determinant of acceptance or satisfaction with AI chatbots and provided detailed measurement items for AI chatbot quality [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref47">47</xref>]. Following a systematic sorting process and discussions with 4 domain experts, we synthesized these findings into an initial pool of 26 second-level indicators for assessing the quality of AI health care chatbots, structured according to the 5 dimensions of the SERVQUAL framework.</p>
      </sec>
      <sec>
        <title>Indicator Selection</title>
        <p>According to the indicator selection criteria and qualitative feedback from the experts, from a total of 26 indicators, 5 (19%) secondary indicators were removed and 21 (81%) were retained in the first round. Between round 1 and round 2, a virtual Delphi meeting was held to discuss indicators for which experts provided revision suggestions and to identify novel indicators based on perceived gaps in current indicators. Experts who had completed round 1 attended the meeting. During this panel meeting, 8 (31%) secondary indicators were merged into 4 (15%) indicators. Following the discussion, 20 experts rated the new indicators. Finally, the 2-round Delphi process reached a finalized evaluation framework comprising 5 (19%) primary indicators and 17 (65%) secondary indicators, each clearly defined in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>The service quality index system for artificial intelligence (AI) health care chatbots.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="220"/>
            <col width="640"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Indicator</td>
                <td>Definition</td>
                <td>Weights</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Assurance</bold>
                </td>
                <td>The ability of AI health care chatbots to provide pertinent responses</td>
                <td>0.239</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Understandable answer</td>
                <td>The AI health care chatbots provide an answer with a logical structure and the right amount of information to the user’s query</td>
                <td>0.082</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Accurate understanding</td>
                <td>The AI health care chatbots understand the exact meaning of the content sent by the user in text and voice</td>
                <td>0.079</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Targeted question</td>
                <td>The AI health care chatbots ask follow-up questions with context awareness based on the user’s query</td>
                <td>0.078</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Reliability</bold>
                </td>
                <td>The ability of AI health care chatbots to inspire trust and confidence</td>
                <td>0.237</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Trustworthy advice</td>
                <td>The AI health care chatbots give medical advice, such as diagnosis, medication, and examination, and detailed explanations, which are consistent across multiple inquiries</td>
                <td>0.071</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Useful service</td>
                <td>The AI health care chatbots are useful in addressing users’ uncertainties about their health concerns</td>
                <td>0.065</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Specific risk warning</td>
                <td>The AI health care chatbots clearly indicate the limitations of their provided answers</td>
                <td>0.050</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Protected privacy</td>
                <td>The AI health care chatbots protect the user’s privacy</td>
                <td>0.051</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Human-likeness</bold>
                </td>
                <td>The social cue, personality, and empathy of AI health care chatbots</td>
                <td>0.187</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Personalized response</td>
                <td>The AI health care chatbots tailor their answers according to the user’s age, sex, and medical history</td>
                <td>0.064</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Emotional attention</td>
                <td>The AI health care chatbots detect user emotion and make the user feel cared for</td>
                <td>0.063</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Kind characteristic</td>
                <td>The AI health care chatbots have a kind name, image, and voice</td>
                <td>0.060</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Tangibility</bold>
                </td>
                <td>The hardware or software manifestations of AI health care chatbots</td>
                <td>0.170</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Accurate recognition</td>
                <td>The AI health care chatbots recognize and transfer the speech of the users into accurate text</td>
                <td>0.046</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Compatible operation</td>
                <td>It is convenient for the user to obtain the service of AI health care chatbots on a mobile app, WeChat mini program, or website</td>
                <td>0.043</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Friendly layout</td>
                <td>The layout of AI health care chatbots is clear and easy to operate</td>
                <td>0.041</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Stable service</td>
                <td>The AI health care chatbots provide the same smooth service in any situation</td>
                <td>0.040</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Responsiveness</bold>
                </td>
                <td>The response ability of AI health care chatbots</td>
                <td>0.167</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Anytime response</td>
                <td>The AI health care chatbots are available 24 hours a day for 365 days</td>
                <td>0.043</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prompt response</td>
                <td>The AI health care chatbots always give timely feedback when it is needed</td>
                <td>0.042</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Coherent response</td>
                <td>The AI health care chatbots can communicate with the user seamlessly by maintaining records within the personal account</td>
                <td>0.042</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Indicator Weights</title>
        <p>On the basis of the AHP and percentage weighting method, the weights for all indicators were calculated (<xref ref-type="table" rid="table4">Table 4</xref>). The primary indicators, ranked from highest to lowest weight, were assurance (0.239), reliability (0.237), human-likeness (0.187), tangibility (0.170), and responsiveness (0.167). Assurance received the highest weight. For the secondary indicators, weights ranged from 0.040 to 0.082. “Understandable answer” had the highest secondary weight (0.082), followed by “Accurate understanding” (0.079), “Targeted question” (0.078), and “Trustworthy advice” (0.071).</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The development of AI health care chatbots is on the rise, and their adoption is becoming increasingly vital in modern health care. Providing AI health care chatbots with high service quality is critical to facilitating their broader diffusion and addressing contemporary health care challenges. Although previous studies have attempted to evaluate the quality of AI chatbots in responding to queries related to specific diseases, a comprehensive and user-centered index system for evaluating the service quality of AI health care chatbots has remained lacking. To our knowledge, this is the first study to develop a comprehensive service quality index system for AI health care chatbots from a patient perspective, using SERVQUAL as the theoretical framework. Through a 2-round Delphi process, a finalized set of 5 primary indicators and 17 secondary indicators was derived, specifically designed to capture both the technical functionality and interactive experience unique to AI health care chatbots. Subsequently, the indicator weights were obtained using the AHP.</p>
        <p>Among the 5 primary indicators, assurance was identified as the most important dimension, which refers to the ability of AI health care chatbots to provide pertinent responses. Unlike consultations with a clinician, AI health care chatbots lack the capacity to perform physical examinations to support diagnosis. Therefore, it is essential for AI health care chatbots to deliver goal-oriented and unambiguous conversations, accurately understand user queries, ask follow-up questions with contextual awareness, and provide understandable answers [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. Previous studies [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>] have taken understandability, often reflected through situation-appropriate response length and information quantity, as a sole metric to measure the quality of AI health care chatbots. Consistent with this emphasis, the secondary indicator “Understandable answer” received the highest weight among secondary indicators. Although aspects such as completeness and consistency have been associated with answer readability in previous studies [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref48">48</xref>], they were not included in this framework. This omission stems from their highly specialized and profession-centric evaluation criteria, which may not align with patient-centered usability expectations.</p>
        <p>The reliability dimension ranked second, following assurance. Current AI technologies remain fallible and necessitate oversight by health professionals to ensure the applicability and safety of the advice provided by AI health care chatbots [<xref ref-type="bibr" rid="ref7">7</xref>]. For users, it is critical that AI health care chatbots provide not only trustworthy medical advice regarding diagnosis, medication, and examinations but also clear explanations that enhance transparency and facilitate informed decision-making, thereby fostering trust and promoting sustained engagement [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. Both users and clinicians have underscored the importance of clearly indicating the limitations of AI-generated medical advice [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. In contrast to earlier studies [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref49">49</xref>], this study deliberately excluded diagnostic accuracy, a frequently used metric, from this index system, as patients generally lack the specialized medical knowledge required to evaluate this aspect.</p>
        <p>The human-likeness dimension is considered a distinctive feature of AI health care chatbots [<xref ref-type="bibr" rid="ref1">1</xref>]. Although it is not ranked highest among the primary indicators, its associated secondary indicators, “Personalized response” and “Emotional attention,” had prominent weight values. Users often perceive AI health care chatbots as an “AI doctor” and tend to evaluate them through direct comparison with human clinicians along these dimensions [<xref ref-type="bibr" rid="ref3">3</xref>]. Enhancing humanlike attributes in interactions of AI health care chatbots remains a critical development objective. This entails increased efforts to enable AI health care chatbots to generate context-aware and individualized replies that adapt to both the conversational flow and user preferences [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <p>The dimension of tangibility refers to hardware and software manifestations of AI health care chatbots. Among its secondary indicators, “Accurate recognition” was assigned the highest weight. As an information system designed to provide health guidance [<xref ref-type="bibr" rid="ref50">50</xref>], the accuracy of recognizing and transferring user speech into precise text is the basis for correctly interpreting user queries and facilitating subsequent consultation processes [<xref ref-type="bibr" rid="ref9">9</xref>]. The next important indicator, “Compatible operation,” reflects the accessibility of the service of AI health care chatbots across diverse digital environments. A previous study has emphasized that users valued the ability to access services of AI health care chatbots through various devices, such as smartphones, tablets, or computers, which supports broader and more equitable adoption [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>Although responsiveness is positioned as the final dimension in the framework, it constitutes a fundamental component of the service quality of AI health care chatbots [<xref ref-type="bibr" rid="ref5">5</xref>]. This dimension is characterized by the provision of active and uninterrupted guidance 24 hours a day, real-time responses without having to wait in line, immediate accessibility from any location without the need for travel, and seamless communication across different devices [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. Given that AI health care chatbots are supported by LLMs, users perceive responsiveness as their inherent capability [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
        <p>Overall, AI health care chatbots currently represent a viable alternative to human clinicians in initial user interactions [<xref ref-type="bibr" rid="ref2">2</xref>]. However, their performance can vary significantly depending on the underlying LLMs, knowledge bases, and health data used [<xref ref-type="bibr" rid="ref31">31</xref>]. While this study developed a service quality index system for AI health care chatbots based on the SERVQUAL framework, most secondary indicators in this study were newly developed to reflect the unique AI context. The proposed index system offers practical value for multiple stakeholders: it enables users to better understand and assess the strengths of AI health care chatbots; supports health service managers in systematically collecting feedback and monitoring performance; and guides developers in conducting feasibility analyses, optimizing design, and implementing postlaunch evaluation. Future research will involve applying this index system in field studies with users of AI health care chatbots to validate its utility and support its ongoing refinement.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>The strengths of this study are as follows. First, this study developed a comprehensive evaluation index system by adapting a scientific framework that incorporates both internationally validated evidence-based indicators and unique features of AI health care chatbots. Second, the mixed methods approach, combining literature review, expert consultations, a 2-round Delphi process, and AHP, ensured a rigorous and systematic development process. Third, this study provides new insights into the systemic evaluation of service quality of AI health care chatbots.</p>
        <p>Several limitations should also be acknowledged. First, although the number of experts consulted met methodological requirements, it remained relatively limited. The panel may be subject to selection bias due to the experts’ familiarity with AI health care chatbots, which could influence the selection and weighting of indicators. Therefore, the scope of expert consultation needs to be further expanded to enhance the validity of the indicators. Second, all participating experts were based in China, which may limit the generalizability of the findings to other cultural or health system contexts. Future studies should validate the proposed evaluation index across a broader range of settings of AI health care chatbots. Third, this index system has not yet been operationalized and evaluated by the users of AI health care chatbots. Further empirical research is needed to demonstrate its practical relevance and utility and to consider incorporating patient experience into the assessment process. Furthermore, although Kendall <italic>W</italic> was statistically significant, its value reflects only a moderate level of consensus. This implies that the findings are robust but limited in microlevel ranking. In this study, experts from diverse professional backgrounds likely held different interpretations and assigned varying weights to the indicators, which may have led to evaluation discrepancies.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study developed a comprehensive, user-centered index system for evaluating the service quality of AI health care chatbots. Through the Delphi method and the AHP, a finalized framework consisting of 5 primary dimensions and 17 secondary indicators was established. These include 4 indicators for tangibility, 3 for responsiveness, 3 for assurance, 3 for human-likeness, and 4 for reliability. This index system prioritizes user needs and experiences and can practically quantify the service quality of AI health care chatbots. The proposed index system will provide valuable support for health policymakers, service managers, and developers by enabling benchmark comparisons, facilitating quality monitoring, and guiding continuous service enhancement.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Search strategy.</p>
        <media xlink:href="jmir_v28i1e83051_app1.docx" xlink:title="DOCX File, 18 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AHP</term>
          <def>
            <p>analytic hierarchy process</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors attest that no generative artificial intelligence technologies were used in the generation of text, figures, or other informational content of this manuscript. The authors acknowledge all experts who participated in the Delphi process and the analytic hierarchy process.</p>
    </ack>
    <notes>
      <title>Data Availability</title>
      <p>The datasets used or analyzed during this study are available from the corresponding author on reasonable request.</p>
    </notes>
    <notes>
      <title>Funding</title>
      <p>This study was supported by the Social Science Fund of Capital Medical University, Beijing, China.</p>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>YG conceptualized the study, designed the consulted index system, interpreted the data, and wrote the manuscript. XW collected and analyzed the data. Both authors approved the final manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laymouna</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lessard</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schuster</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Engler</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lebouché</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Roles, users, benefits, and limitations of chatbots in health care: rapid review</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>07</month>
          <day>23</day>
          <volume>26</volume>
          <fpage>e56930</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024/1/e56930/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/56930</pub-id>
          <pub-id pub-id-type="medline">39042446</pub-id>
          <pub-id pub-id-type="pii">v26i1e56930</pub-id>
          <pub-id pub-id-type="pmcid">PMC11303905</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Kraut</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>Systematic review and meta-analysis of AI-based conversational agents for promoting mental health and well-being</article-title>
          <source>NPJ Digit Med</source>
          <year>2023</year>
          <month>12</month>
          <day>19</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>236</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00979-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00979-5</pub-id>
          <pub-id pub-id-type="medline">38114588</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00979-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC10730549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iacobucci</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The AI bot will see you now: how technology is changing the doctor-patient relationship</article-title>
          <source>BMJ</source>
          <year>2024</year>
          <month>03</month>
          <day>28</day>
          <volume>384</volume>
          <fpage>q711</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.q711</pub-id>
          <pub-id pub-id-type="medline">38548277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Maduranayagam</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Suthakar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lokker</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Iorio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Attitudes and perceptions of medical researchers towards the use of artificial intelligence chatbots in the scientific process: an international cross-sectional survey</article-title>
          <source>Lancet Digit Health</source>
          <year>2025</year>
          <month>01</month>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e94</fpage>
          <lpage>102</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-7500(24)00202-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2589-7500(24)00202-4</pub-id>
          <pub-id pub-id-type="medline">39550312</pub-id>
          <pub-id pub-id-type="pii">S2589-7500(24)00202-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mahal</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Geisel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Geiger</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Staatz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zappel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lerch</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Ehrenthal</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ditzen</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>User preferences and trust in hypothetical analog, digitalized and AI-based medical consultation scenarios: an online discrete choice survey</article-title>
          <source>Comput Human Behav</source>
          <year>2024</year>
          <month>12</month>
          <volume>161</volume>
          <fpage>108419</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/S0747563224002875"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chb.2024.108419</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Armbruster</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bussmann</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rothhaas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Titze</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Grützner</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Freischmidt</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>"Doctor ChatGPT, can you help me?" the patient's perspective: cross-sectional study</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>10</month>
          <day>01</day>
          <volume>26</volume>
          <fpage>e58831</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024/1/e58831/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/58831</pub-id>
          <pub-id pub-id-type="medline">39352738</pub-id>
          <pub-id pub-id-type="pii">v26i1e58831</pub-id>
          <pub-id pub-id-type="pmcid">PMC11480680</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Magnante</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Embry</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mathis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mooney</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haj-Hassan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cottingham</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Padala</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Doctor AI? A pilot study examining responses of artificial intelligence to common questions asked by geriatric patients</article-title>
          <source>Front Artif Intell</source>
          <year>2024</year>
          <month>07</month>
          <day>25</day>
          <volume>7</volume>
          <fpage>1438012</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/frai.2024.1438012"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/frai.2024.1438012</pub-id>
          <pub-id pub-id-type="medline">39118788</pub-id>
          <pub-id pub-id-type="pmcid">PMC11306168</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hammond</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zakowski</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Readability, quality and accuracy of generative artificial intelligence chatbots for commonly asked questions about labor epidurals: a comparison of ChatGPT and Bard</article-title>
          <source>Int J Obstet Anesth</source>
          <year>2025</year>
          <month>02</month>
          <volume>61</volume>
          <fpage>104317</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijoa.2024.104317</pub-id>
          <pub-id pub-id-type="medline">39754839</pub-id>
          <pub-id pub-id-type="pii">S0959-289X(24)00329-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olszewski</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Watros</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mańczak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Owoc</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jeziorski</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Brzeziński</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Assessing the response quality and readability of chatbots in cardiovascular health, oncology, and psoriasis: a comparative study</article-title>
          <source>Int J Med Inform</source>
          <year>2024</year>
          <month>10</month>
          <volume>190</volume>
          <fpage>105562</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1386-5056(24)00225-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2024.105562</pub-id>
          <pub-id pub-id-type="medline">39059084</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(24)00225-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Assessing ChatGPT as a medical consultation assistant for chronic Hepatitis B: cross-language study of English and Chinese</article-title>
          <source>JMIR Med Inform</source>
          <year>2024</year>
          <month>08</month>
          <day>08</day>
          <volume>12</volume>
          <fpage>e56426</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2024/1/e56426/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/56426</pub-id>
          <pub-id pub-id-type="medline">39115930</pub-id>
          <pub-id pub-id-type="pii">v12i1e56426</pub-id>
          <pub-id pub-id-type="pmcid">PMC11342014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Musheyev</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bockelman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Loeb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kabarriti</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Assessment of artificial intelligence chatbot responses to top searched queries about cancer</article-title>
          <source>JAMA Oncol</source>
          <year>2023</year>
          <month>10</month>
          <day>01</day>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>1437</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaoncol.2023.2947</pub-id>
          <pub-id pub-id-type="medline">37615960</pub-id>
          <pub-id pub-id-type="pii">2808733</pub-id>
          <pub-id pub-id-type="pmcid">PMC10450581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stapleton</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Santucci</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cundy</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Sathianathen</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Quality of information on Wilms tumor from artificial intelligence chatbots: what are your patients and their families reading?</article-title>
          <source>Urology</source>
          <year>2025</year>
          <month>04</month>
          <volume>198</volume>
          <fpage>130</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1016/j.urology.2025.01.054</pub-id>
          <pub-id pub-id-type="medline">39914668</pub-id>
          <pub-id pub-id-type="pii">S0090-4295(25)00103-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Owens</surname>
              <given-names>OL</given-names>
            </name>
            <name name-style="western">
              <surname>Leonard</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Evaluating an AI chatbot "Prostate Cancer Info" for providing quality prostate cancer screening information: cross-sectional study</article-title>
          <source>JMIR Cancer</source>
          <year>2025</year>
          <month>05</month>
          <day>21</day>
          <volume>11</volume>
          <fpage>e72522</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cancer.jmir.org/2025/1/e72522/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/72522</pub-id>
          <pub-id pub-id-type="medline">40397820</pub-id>
          <pub-id pub-id-type="pii">v11i1e72522</pub-id>
          <pub-id pub-id-type="pmcid">PMC12118940</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anastasio</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Foote</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Melamed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Modesitt</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Musa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rossi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Albright</surname>
              <given-names>BB</given-names>
            </name>
            <name name-style="western">
              <surname>Havrilesky</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Moss</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>The doc versus the bot: a pilot study to assess the quality and accuracy of physician and chatbot responses to clinical questions in gynecologic oncology</article-title>
          <source>Gynecol Oncol Rep</source>
          <year>2024</year>
          <month>08</month>
          <day>08</day>
          <volume>55</volume>
          <fpage>101477</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2352-5789(24)00156-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.gore.2024.101477</pub-id>
          <pub-id pub-id-type="medline">39224817</pub-id>
          <pub-id pub-id-type="pii">S2352-5789(24)00156-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC11367046</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Physician versus large language model chatbot responses to web-based questions from autistic patients in Chinese: cross-sectional comparative analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2024</year>
          <month>04</month>
          <day>30</day>
          <volume>26</volume>
          <fpage>e54706</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2024/1/e54706/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/54706</pub-id>
          <pub-id pub-id-type="medline">38687566</pub-id>
          <pub-id pub-id-type="pii">v26i1e54706</pub-id>
          <pub-id pub-id-type="pmcid">PMC11094593</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Poliak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Faix</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Longhurst</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Hogarth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Comparing physician and artificial intelligence chatbot responses to patient questions posted to a public social media forum</article-title>
          <source>JAMA Intern Med</source>
          <year>2023</year>
          <month>06</month>
          <day>01</day>
          <volume>183</volume>
          <issue>6</issue>
          <fpage>589</fpage>
          <lpage>96</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37115527"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2023.1838</pub-id>
          <pub-id pub-id-type="medline">37115527</pub-id>
          <pub-id pub-id-type="pii">2804309</pub-id>
          <pub-id pub-id-type="pmcid">PMC10148230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parasuraman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zeithaml</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>LL</given-names>
            </name>
          </person-group>
          <article-title>A conceptual model of service quality and its implications for future research</article-title>
          <source>J Mark</source>
          <year>1985</year>
          <month>09</month>
          <day>01</day>
          <volume>49</volume>
          <issue>4</issue>
          <fpage>41</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jstor.org/stable/1251430"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/002224298504900403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karasan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Erdogan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cinar</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Healthcare service quality evaluation: an integrated decision-making methodology and a case study</article-title>
          <source>Socio-Econ Plan Sci</source>
          <year>2022</year>
          <month>08</month>
          <volume>82</volume>
          <fpage>101234</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S003801212200012X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.seps.2022.101234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>QL</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>LN</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>DX</given-names>
            </name>
          </person-group>
          <article-title>Identifying quality indicators for home care services: a modified Delphi and Analytic Hierarchy Process study</article-title>
          <source>BMC Nurs</source>
          <year>2024</year>
          <month>07</month>
          <day>19</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>494</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcnurs.biomedcentral.com/articles/10.1186/s12912-024-02169-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12912-024-02169-4</pub-id>
          <pub-id pub-id-type="medline">39026316</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12912-024-02169-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC11264849</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lemmen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Woopen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Stock</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Systems medicine 2030: a Delphi study on implementation in the German healthcare system</article-title>
          <source>Health Policy</source>
          <year>2021</year>
          <month>01</month>
          <volume>125</volume>
          <issue>1</issue>
          <fpage>104</fpage>
          <lpage>14</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0168-8510(20)30292-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.healthpol.2020.11.010</pub-id>
          <pub-id pub-id-type="medline">33288301</pub-id>
          <pub-id pub-id-type="pii">S0168-8510(20)30292-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Developing an evaluation index system for service capability of internet hospitals in China: mixed methods study</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>07</month>
          <day>25</day>
          <volume>27</volume>
          <fpage>e72931</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e72931/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/72931</pub-id>
          <pub-id pub-id-type="medline">40712159</pub-id>
          <pub-id pub-id-type="pii">v27i1e72931</pub-id>
          <pub-id pub-id-type="pmcid">PMC12296255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rakofsky</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>YL</given-names>
            </name>
          </person-group>
          <article-title>Developing medical record-based, healthcare quality indicators for psychiatric hospitals in China: a modified Delphi-Analytic Hierarchy Process study</article-title>
          <source>Int J Qual Health Care</source>
          <year>2019</year>
          <month>12</month>
          <day>31</day>
          <volume>31</volume>
          <issue>10</issue>
          <fpage>733</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1093/intqhc/mzz005</pub-id>
          <pub-id pub-id-type="medline">30753601</pub-id>
          <pub-id pub-id-type="pii">5316183</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Developing quality indicators for cancer hospitals in China: a national modified Delphi process</article-title>
          <source>BMJ Open</source>
          <year>2024</year>
          <month>04</month>
          <day>09</day>
          <volume>14</volume>
          <issue>4</issue>
          <fpage>e082930</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=38594187"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2023-082930</pub-id>
          <pub-id pub-id-type="medline">38594187</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2023-082930</pub-id>
          <pub-id pub-id-type="pmcid">PMC11015267</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saaty</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>The analytic hierarchy process—what it is and how it is used</article-title>
          <source>Math Model</source>
          <year>1987</year>
          <volume>9</volume>
          <issue>3-5</issue>
          <fpage>161</fpage>
          <lpage>76</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/0270025587904738"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/0270-0255(87)90473-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Geng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Competency model for dentists in China: results of a Delphi study</article-title>
          <source>PLoS One</source>
          <year>2018</year>
          <month>03</month>
          <day>22</day>
          <volume>13</volume>
          <issue>3</issue>
          <fpage>e0194411</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0194411"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0194411</pub-id>
          <pub-id pub-id-type="medline">29566048</pub-id>
          <pub-id pub-id-type="pii">PONE-D-17-17588</pub-id>
          <pub-id pub-id-type="pmcid">PMC5864007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>The development of a performance evaluation index system for Chinese Centers for Disease Control and Prevention: a Delphi consensus study</article-title>
          <source>Glob Health Res Policy</source>
          <year>2024</year>
          <month>07</month>
          <day>23</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>28</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ghrp.biomedcentral.com/articles/10.1186/s41256-024-00367-w"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s41256-024-00367-w</pub-id>
          <pub-id pub-id-type="medline">39044214</pub-id>
          <pub-id pub-id-type="pii">10.1186/s41256-024-00367-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC11265441</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Developing online medical service quality indicators in China from the perspective of online and offline integration: a modified Delphi-analytic hierarchy process study</article-title>
          <source>Int J Qual Health Care</source>
          <year>2023</year>
          <month>06</month>
          <day>16</day>
          <volume>35</volume>
          <issue>2</issue>
          <fpage>mzad038</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37279543"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/intqhc/mzad038</pub-id>
          <pub-id pub-id-type="medline">37279543</pub-id>
          <pub-id pub-id-type="pii">7190135</pub-id>
          <pub-id pub-id-type="pmcid">PMC10275532</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barletta</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Caivano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Colizzi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dimauro</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Piattini</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Clinical-chatbot AHP evaluation based on "quality in use" of ISO/IEC 25010</article-title>
          <source>Int J Med Inform</source>
          <year>2023</year>
          <month>02</month>
          <volume>170</volume>
          <fpage>104951</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2022.104951</pub-id>
          <pub-id pub-id-type="medline">36525800</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(22)00265-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sobowale</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Humphrey</surname>
              <given-names>DK</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the quality of psychotherapy conversational agents: framework development and cross-sectional study</article-title>
          <source>JMIR Form Res</source>
          <year>2025</year>
          <month>07</month>
          <day>02</day>
          <volume>9</volume>
          <fpage>e65605</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e65605/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/65605</pub-id>
          <pub-id pub-id-type="medline">40600851</pub-id>
          <pub-id pub-id-type="pii">v9i1e65605</pub-id>
          <pub-id pub-id-type="pmcid">PMC12239686</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Assessing usability of intelligent guidance chatbots in Chinese hospitals: cross-sectional study</article-title>
          <source>Digit Health</source>
          <year>2024</year>
          <month>06</month>
          <day>06</day>
          <volume>10</volume>
          <fpage>20552076241260504</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/20552076241260504?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20552076241260504</pub-id>
          <pub-id pub-id-type="medline">38854920</pub-id>
          <pub-id pub-id-type="pii">10.1177_20552076241260504</pub-id>
          <pub-id pub-id-type="pmcid">PMC11159538</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shiferaw</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Winter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mike</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>LN</given-names>
            </name>
          </person-group>
          <article-title>Assessing the accuracy and quality of artificial intelligence (AI) chatbot-generated responses in making patient-specific drug-therapy and healthcare-related decisions</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2024</year>
          <month>12</month>
          <day>24</day>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>404</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-024-02824-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-024-02824-5</pub-id>
          <pub-id pub-id-type="medline">39719573</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-024-02824-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC11668057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Motegi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shino</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kuwabara</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Matsuyama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tada</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hagiwara</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chikamatsu</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Comparison of physician and large language model chatbot responses to online ear, nose, and throat inquiries</article-title>
          <source>Sci Rep</source>
          <year>2025</year>
          <month>07</month>
          <day>01</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>21346</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-025-06769-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-025-06769-1</pub-id>
          <pub-id pub-id-type="medline">40596359</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-025-06769-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC12215459</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abd-Alrazaq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Safi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Alajlani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Warren</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Househ</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Denecke</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Technical metrics used to evaluate health care chatbots: scoping review</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>06</month>
          <day>05</day>
          <volume>22</volume>
          <issue>6</issue>
          <fpage>e18301</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/6/e18301/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18301</pub-id>
          <pub-id pub-id-type="medline">32442157</pub-id>
          <pub-id pub-id-type="pii">v22i6e18301</pub-id>
          <pub-id pub-id-type="pmcid">PMC7305563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YS</given-names>
            </name>
            <name name-style="western">
              <surname>Tae</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>IH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Availability of ChatGPT to provide medical information for patients with kidney cancer</article-title>
          <source>Sci Rep</source>
          <year>2024</year>
          <month>01</month>
          <day>17</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>1542</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-024-51531-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-024-51531-8</pub-id>
          <pub-id pub-id-type="medline">38233511</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-024-51531-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC10794224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chagas</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Pagano</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Prates</surname>
              <given-names>RO</given-names>
            </name>
            <name name-style="western">
              <surname>Praes</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreguetti</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Vaz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Reis</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Pedroso</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Beleigoli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Marcolino</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Evaluating user experience with a chatbot designed as a public health response to the COVID-19 pandemic in Brazil: mixed methods study</article-title>
          <source>JMIR Hum Factors</source>
          <year>2023</year>
          <month>04</month>
          <day>03</day>
          <volume>10</volume>
          <fpage>e43135</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://humanfactors.jmir.org/2023/1/e43135/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/43135</pub-id>
          <pub-id pub-id-type="medline">36634267</pub-id>
          <pub-id pub-id-type="pii">v10i1e43135</pub-id>
          <pub-id pub-id-type="pmcid">PMC10131797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chaudhry</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Debi</surname>
              <given-names>HR</given-names>
            </name>
          </person-group>
          <article-title>User perceptions and experiences of an AI-driven conversational agent for mental health support</article-title>
          <source>Mhealth</source>
          <year>2024</year>
          <month>07</month>
          <volume>10</volume>
          <fpage>22</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.21037/mhealth-23-55"/>
          </comment>
          <pub-id pub-id-type="doi">10.21037/mhealth-23-55</pub-id>
          <pub-id pub-id-type="medline">39114462</pub-id>
          <pub-id pub-id-type="pii">mh-10-23-55</pub-id>
          <pub-id pub-id-type="pmcid">PMC11304096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Noor</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Rao Hill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Troshani</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Developing a service quality scale for artificial intelligence service agents</article-title>
          <source>Eur J Mark</source>
          <year>2022</year>
          <month>05</month>
          <day>09</day>
          <volume>56</volume>
          <issue>5</issue>
          <fpage>1301</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/org/science/article/abs/pii/S0309056622000910"/>
          </comment>
          <pub-id pub-id-type="doi">10.1108/EJM-09-2020-0672</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>YM</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>YB</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Classifying and measuring the service quality of AI chatbot in frontline service</article-title>
          <source>J Bus Res</source>
          <year>2022</year>
          <month>06</month>
          <volume>145</volume>
          <fpage>552</fpage>
          <lpage>68</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jbusres.2022.02.088</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Exploring the varying effects of chatbot service quality dimensions on customer intentions to switch service agents</article-title>
          <source>Sci Rep</source>
          <year>2025</year>
          <month>07</month>
          <day>02</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>22559</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-025-06490-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-025-06490-z</pub-id>
          <pub-id pub-id-type="medline">40596391</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-025-06490-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC12217029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Radziwill</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Benton</surname>
              <given-names>MC</given-names>
            </name>
          </person-group>
          <article-title>Evaluating quality of chatbots and intelligent conversational agents</article-title>
          <source>arXiv. Preprint posted online April 15, 2017</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1704.04579"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1704.04579</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pattanshetti</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Extensive study: performance, metrics and usability of chatbot</article-title>
          <source>Int Res J Eng Technol</source>
          <year>2021</year>
          <month>09</month>
          <volume>8</volume>
          <issue>9</issue>
          <fpage>1527</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.academia.edu/59222363/IRJET_Extensive_Study_Performance_Metrics_and_Usability_of_Chatbot"/><!-- original link text also listed: "OR IRJET-V8I9218.pdf" -->
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Borsci</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Malizia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schmettow</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van der Velde</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Tariverdiyeva</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Balaji</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chamberlain</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The chatbot usability scale: the design and pilot of a usability scale for interaction with AI-based conversational agents</article-title>
          <source>Pers Ubiquit Comput</source>
          <year>2021</year>
          <month>07</month>
          <day>21</day>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>95</fpage>
          <lpage>119</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1007/s00779-021-01582-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00779-021-01582-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pelau</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dabija</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Ene</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>What makes an AI device human-like? The role of interaction quality, empathy and perceived psychological anthropomorphic characteristics in the acceptance of artificial intelligence in the service industry</article-title>
          <source>Comput Human Behav</source>
          <year>2021</year>
          <month>09</month>
          <volume>122</volume>
          <fpage>106855</fpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2021.106855</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>YL</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Can chatbots satisfy me? A mixed-method comparative study of satisfaction with task-oriented chatbots in mainland China and Hong Kong</article-title>
          <source>Comput Human Behav</source>
          <year>2023</year>
          <month>06</month>
          <volume>143</volume>
          <fpage>107716</fpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2023.107716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chopra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ranjani</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Narsipur</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Service quality dimensions in AI-enabled chatbots leading to customer satisfaction: a study from South Asia</article-title>
          <source>IIFT Int Bus Manag Rev</source>
          <year>2023</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>26</fpage>
          <lpage>49</lpage>
          <pub-id pub-id-type="doi">10.1177/jiift.221150355</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shahzad</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Javed</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Assessing the impact of AI-chatbot service quality on user e-brand loyalty through chatbot user trust, experience and electronic word of mouth</article-title>
          <source>J Retail Consum Serv</source>
          <year>2024</year>
          <month>07</month>
          <volume>79</volume>
          <fpage>103867</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S0969698924001632"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jretconser.2024.103867</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Young</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>GY</given-names>
            </name>
          </person-group>
          <article-title>User satisfaction with the service quality of ChatGPT</article-title>
          <source>Serv Bus</source>
          <year>2024</year>
          <month>09</month>
          <day>02</day>
          <volume>18</volume>
          <issue>3-4</issue>
          <fpage>417</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/article/10.1007/s11628-024-00566-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11628-024-00566-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fanous</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Steffner</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Daneshjou</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Patient attitudes toward the AI doctor</article-title>
          <source>Nat Med</source>
          <year>2024</year>
          <month>11</month>
          <day>23</day>
          <volume>30</volume>
          <issue>11</issue>
          <fpage>3057</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-024-03272-4</pub-id>
          <pub-id pub-id-type="medline">39313596</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-024-03272-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Büker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mercan</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Readability, accuracy and appropriateness and quality of AI chatbot responses as a patient information source on root canal retreatment: a comparative assessment</article-title>
          <source>Int J Med Inform</source>
          <year>2025</year>
          <month>09</month>
          <volume>201</volume>
          <fpage>105948</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2025.105948</pub-id>
          <pub-id pub-id-type="medline">40288015</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(25)00165-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grilo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Marques</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Corte-Real</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Carolino</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Caetano</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Assessing the quality and reliability of ChatGPT's responses to radiotherapy-related patient queries: comparative study with GPT-3.5 and GPT-4</article-title>
          <source>JMIR Cancer</source>
          <year>2025</year>
          <month>04</month>
          <day>16</day>
          <volume>11</volume>
          <fpage>e63677</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cancer.jmir.org/2025/1/e63677/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/63677</pub-id>
          <pub-id pub-id-type="medline">40239208</pub-id>
          <pub-id pub-id-type="pii">v11i1e63677</pub-id>
          <pub-id pub-id-type="pmcid">PMC12017613</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
