<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="review-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i6e18301</article-id>
      <article-id pub-id-type="pmid">32442157</article-id>
      <article-id pub-id-type="doi">10.2196/18301</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Technical Metrics Used to Evaluate Health Care Chatbots: Scoping Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Lovis</surname>
            <given-names>Christian</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Iqbal</surname>
            <given-names>Dr. Usman</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Bellei</surname>
            <given-names>Ericles</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Abd-Alrazaq</surname>
            <given-names>Alaa</given-names>
          </name>
          <degrees>BSc, MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7695-4626</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Safi</surname>
            <given-names>Zeineb</given-names>
          </name>
          <degrees>BSc, MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0526-8949</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Alajlani</surname>
            <given-names>Mohannad</given-names>
          </name>
          <degrees>BSc, MSc, MBA, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5691-7120</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Warren</surname>
            <given-names>Jim</given-names>
          </name>
          <degrees>BS, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8660-8951</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Househ</surname>
            <given-names>Mowafa</given-names>
          </name>
          <degrees>BCom, MEng, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3648-6271</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Denecke</surname>
            <given-names>Kerstin</given-names>
          </name>
          <degrees>Dr rer nat</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <address>
            <institution>Institute for Medical Informatics</institution>
            <institution>Bern University of Applied Sciences</institution>
            <addr-line>Quellgasse 21</addr-line>
            <addr-line>2502 Biel</addr-line>
            <addr-line>Bern</addr-line>
            <country>Switzerland</country>
            <phone>41 76 409 97 61</phone>
            <email>kerstin.denecke@bfh.ch</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6691-396X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>College of Science and Engineering</institution>
        <institution>Hamad Bin Khalifa University</institution>
        <addr-line>Doha</addr-line>
        <country>Qatar</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Institute of Digital Healthcare</institution>
        <institution>University of Warwick</institution>
        <addr-line>Coventry</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>School of Computer Science</institution>
        <institution>University of Auckland</institution>
        <addr-line>Auckland</addr-line>
        <country>New Zealand</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Institute for Medical Informatics</institution>
        <institution>Bern University of Applied Sciences</institution>
        <addr-line>Bern</addr-line>
        <country>Switzerland</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Kerstin Denecke <email>kerstin.denecke@bfh.ch</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>6</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>5</day>
        <month>6</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>6</issue>
      <elocation-id>e18301</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>2</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>8</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>13</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>15</day>
          <month>4</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Alaa Abd-Alrazaq, Zeineb Safi, Mohannad Alajlani, Jim Warren, Mowafa Househ, Kerstin Denecke. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 05.06.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2020/6/e18301/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Dialog agents (chatbots) have a long history of application in health care, where they have been used for tasks such as supporting patient self-management and providing counseling. Their use is expected to grow with increasing demands on health systems and improving artificial intelligence (AI) capability. Approaches to the evaluation of health care chatbots, however, appear to be diverse and haphazard, resulting in a potential barrier to the advancement of the field.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to identify the technical (nonclinical) metrics used by previous studies to evaluate health care chatbots.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Studies were identified by searching 7 bibliographic databases (eg, MEDLINE and PsycINFO) in addition to conducting backward and forward reference list checking of the included studies and relevant reviews. The studies were independently selected by two reviewers who then extracted data from the included studies. Extracted data were synthesized narratively by grouping the identified metrics into categories based on the aspect of chatbots that the metrics evaluated.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Of the 1498 citations retrieved, 65 studies were included in this review. Chatbots were evaluated using 27 technical metrics, which were related to chatbots as a whole (eg, usability, classifier performance, speed), response generation (eg, comprehensibility, realism, repetitiveness), response understanding (eg, chatbot understanding as assessed by users, word error rate, concept error rate), and esthetics (eg, appearance of the virtual agent, background color, and content).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The technical metrics of health chatbot studies were diverse, with survey designs and global usability metrics dominating. The lack of standardization and paucity of objective measures make it difficult to compare the performance of health chatbots and could inhibit advancement of the field. We suggest that researchers more frequently include metrics computed from conversation logs. In addition, we recommend the development of a framework of technical metrics with recommendations for specific circumstances for their inclusion in chatbot studies.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>chatbots</kwd>
        <kwd>conversational agents</kwd>
        <kwd>health care</kwd>
        <kwd>evaluation</kwd>
        <kwd>metrics</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The potential of human-computer dialog to provide health care benefits has been perceived for many decades. In 1966, Weizenbaum’s ELIZA system caught the public imagination with its imitation of a psychotherapist through the relatively simple linguistic token manipulation possible at the time [<xref ref-type="bibr" rid="ref1">1</xref>]. From the mid-1990s, a family of interventions based on automated telephone sessions (telephone-linked care) demonstrated effectiveness in promoting health adherence across a range of behaviors including medication, diet, and physical activity [<xref ref-type="bibr" rid="ref2">2</xref>]. As mobile phones have become commonplace, a range of SMS text messaging–based interventions have been developed and trialed, with particular success in smoking cessation [<xref ref-type="bibr" rid="ref3">3</xref>]. At the same time, internet/web-based interventions have shown the ability to promote positive health behavior change [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>], and the interaction components associated with users sticking with an internet intervention are increasingly well understood and include the inclusion of dialog elements [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>With the advent of smartphones, the distribution of highly interactive chatbots has been greatly facilitated, particularly with the ubiquitous use of app stores and wide installation of chat apps that can include chatbots, notably Facebook Messenger. Chatbots, as with other electronic health (eHealth) interventions, offer scalability and 24-hour availability to plug gaps in unmet health needs. For example, Woebot delivers cognitive behavior therapy and has been tested with students with depression [<xref ref-type="bibr" rid="ref7">7</xref>]. The students who used Woebot significantly reduced their symptoms of depression over the study period as measured by the depression questionnaire PHQ-9, while those in the information control group (who instead read a self-help book) did not [<xref ref-type="bibr" rid="ref7">7</xref>]. In recent years, artificial intelligence (AI) based on deep learning has created waves with its ability to outperform physicians at some diagnostic tasks [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. XiaoIce is a social chatbot that emphasizes emotional connection and it has communicated with over 660 million active users since its launch in 2014 [<xref ref-type="bibr" rid="ref10">10</xref>]; its performance shows that deep learning can be successfully applied to meaningful dialog tasks. Combining the factors of ease-of-distribution, successful applications, and AI methods to improve health chatbot performance, it is reasonable to expect health chatbots in increasing numbers and variety to take an increasingly serious role in the health care system.</p>
      </sec>
      <sec>
        <title>Research Problem and Aim</title>
        <p>To be an evidence-based discipline requires measurement of performance. The impact of health chatbots on clinical outcomes is the ultimate measure of success. For example, did the condition (eg, depression, diabetes) improve to a statistically significant degree on an accepted measure (eg, PHQ-9 [<xref ref-type="bibr" rid="ref11">11</xref>] or hemoglobin A1c [<xref ref-type="bibr" rid="ref12">12</xref>], respectively), as compared to a control group? Such studies, however, may require large sample sizes to detect the effect and provide relatively little insight into the mechanism by which the chatbot achieves the change; additionally, studies may provide particularly little insight if the result is negative.</p>
        <p>As an alternative and useful precursor to clinical outcome metrics, technical metrics concern the performance of the chatbot itself (eg, did participants feel that it was usable, give appropriate responses, and understand their input?). Appropriateness refers to the relevance of the provided information in addressing the problem prompted [<xref ref-type="bibr" rid="ref13">13</xref>]. Furthermore, this includes more objective measures of the chatbot interaction, such as the number of conversational turns taken in a session or time taken, and measures that require some interpretation but are still well-defined, such as task completion. These technical measures offer a potential method for comparison of health chatbots and for understanding the use and performance of a chatbot to decide if it is working well enough to warrant the time and expense of a trial to measure clinical outcomes.</p>
        <p>Previously, we had introduced a framework for evaluation measures of health chatbots to provide guidance to developers [<xref ref-type="bibr" rid="ref14">14</xref>]. The framework development, however, was based on a relatively informal process vulnerable to the authors’ biases in terms of what studies were considered in its formulation. Therefore, the aim of this study is to use a rigorous review methodology to identify the technical metrics used by previous studies to evaluate health care chatbots. The final goal of these efforts is to be able to make recommendations for an evaluation framework for health chatbots.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>To achieve the aforementioned objective, a scoping review was conducted. To conduct a transparent and replicable review, we followed the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) Extension for Scoping Reviews (PRISMA-ScR) guidelines [<xref ref-type="bibr" rid="ref15">15</xref>]. This research was conducted by an interdisciplinary team of researchers with backgrounds in nursing, computer science, and mental health applications.</p>
      </sec>
      <sec>
        <title>Search Strategy</title>
        <sec>
          <title>Search Sources</title>
          <p>For this review, we searched the following bibliographic databases November 1-3, 2019: MEDLINE (via EBSCO), EMBASE (Excerpta Medica Database; via Ovid), PsycINFO (via Ovid), CINAHL (Cumulative Index of Nursing and Allied Health Literature; via EBSCO), IEEE (Institute of Electrical and Electronics Engineers) Xplore, ACM (Association for Computing Machinery) Digital Library, and Google Scholar. We screened only the first 100 hits retrieved by searching Google Scholar, as it usually retrieves several thousand references ordered by their relevance to the search topic. We checked the reference list of the included studies to identify further studies relevant to the current review (ie, backward reference list checking). Additionally, we used the “cited by” function available in Google Scholar to find and screen studies that cited the included studies (ie, forward reference list checking).</p>
        </sec>
        <sec>
          <title>Search Terms</title>
          <p>The search terms were derived from previously published literature and the opinions of informatics experts. For health-related databases, we used search terms related to the intervention of interest (eg, chatbot, conversational agent, and chat-bot). In addition to intervention-related terms, we used terms related to the context (eg, health, disease, and medical) for non–health-related databases (eg, IEEE and ACM digital library). <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> details the search strings used for searching each electronic database.</p>
        </sec>
      </sec>
      <sec>
        <title>Study Eligibility Criteria</title>
        <p>The intervention of interest in this review was chatbots that are aimed at delivering health care services to patients. Chatbots implemented in stand-alone software or web-based platforms were included. However, we excluded chatbots operated by a human (Wizard-of-Oz) or integrated into robotics, serious games, SMS text messaging, or telephone systems. To be included, studies had to report a technical evaluation of a chatbot (eg, usability, classifier performance, and word error rate). We included peer-reviewed articles, dissertations, and conference proceedings, and we excluded reviews, proposals, editorials, and conference abstracts. This review included studies written in the English language only. No restrictions were considered regarding the study design, study setting, year of publication, and country of publication.</p>
      </sec>
      <sec>
        <title>Study Selection</title>
        <p>Authors MA and ZS independently screened the titles and abstracts of all retrieved references and then independently read the full texts of included studies. Any disagreements between the two reviewers were resolved by AA. We assessed the intercoder agreement by calculating Cohen, which was 0.82 for screening titles and abstracts and 0.91 for reading full texts, indicating a very good agreement [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>To conduct a reliable and accurate extraction of data from the included studies, a data extraction form was developed and piloted using 8 included studies (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). The data extraction process was independently conducted by two reviewers (MA and ZS) and a third reviewer (AA) resolved any disagreements. Intercoder agreement between the reviewers was good (Cohen κ=0.67).</p>
      </sec>
      <sec>
        <title>Data Synthesis</title>
        <p>A narrative approach was used to synthesize the extracted data. After identifying all technical metrics used by the included studies to evaluate chatbots, we divided them into 4 categories based on the aspect of chatbots that the metrics evaluate. The 4 categories were formed after a discussion by the authors in which consensus was reached. For each metric, we identified how the studies measured it. Data synthesis was managed using Microsoft Excel (Microsoft Corporation).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Search Results</title>
        <p>By searching the 7 electronic databases, 1498 citations were retrieved. After removing 199 (13.3%) duplicates of these citations, 1299 (86.7%) titles and abstracts were screened. The screening process resulted in excluding 1113 (74.3%) titles and abstracts due to several reasons detailed in <xref rid="figure1" ref-type="fig">Figure 1</xref>. When we read the full text of the remaining 186 (12.4%) citations, a further 133 (8.9%) citations were excluded (<xref rid="figure1" ref-type="fig">Figure 1</xref>). In total, 12 studies were found by backward and forward reference checking. We included 65 studies in the review.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowchart of the study selection process.</p>
          </caption>
          <graphic xlink:href="jmir_v22i6e18301_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Description of Included Studies</title>
        <p>Characteristics of the included studies are detailed in <xref ref-type="table" rid="table1">Table 1</xref>. Cross-sectional survey was the most commonly used study design (n=41, 63%). About 57% (n=37) of the included studies were published as journal articles. Half of the studies (n=33, 51%) were conducted in the United States. Approximately 70% (n=45) of the studies were published between 2015 and 2019.</p>
        <p>The sample size was reported in 61 studies, and 38 studies (62%) had 50 or fewer participants. In 44 studies, the age of participants was reported; the mean age of participants was 39 years, with a range of 13-79 years. Sex of participants was reported in 54 studies, where the mean percentage of males was 48.1%. Of the 62 studies that reported participants’ health conditions, 34 (54.8%) studies recruited participants from a clinical population (ie, those with health issues). Participants were recruited from clinical settings (n=30, 49.2%), community (n=20, 32.8%), and educational settings (n=18, 29.5%). Metadata and population characteristics of each included study are presented in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
        <p>Chatbots were used for self-management (n=17, 26.2%), therapeutic purposes (n=12, 18.5%), counselling (n=12, 18.5%), education (n=10, 15.4%), screening (n=9, 13.8%), training (n=7, 10.8%), and diagnosing (n=3, 4.6%). Although chatbots were implemented in stand-alone software in about 62% (n=40) of studies, chatbots were implemented in web-based platforms in the remaining studies (n=25, 39%). Chatbot responses were generated based on predefined rules, machine learning approaches, or both methods (hybrid) in 82% (N=53), 17% (n=11), and 2% (n=1) of the included studies, respectively. In the majority of studies (n=58, 89%), chatbots led the dialogue. In about 62% (n=40) of studies, users interacted with chatbots only by typing in their utterances (texts). The most common modalities used by chatbots to interact with users were a combination of text, voice, and nonverbal language (ie, facial expression and body language; n=21, 32%), text only (n=20, 31%), and a combination of voice and nonverbal language (n=19, 29%). The most common disorders targeted by chatbots were any health condition (n=20, 31%) and depression (n=15, 23%). <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref> displays characteristics of the intervention in each included study.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Characteristics of the included studies (N=65).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="540"/>
            <col width="0"/>
            <col width="400"/>
            <thead>
              <tr valign="bottom">
                <td colspan="4">Parameters and characteristics</td>
                <td>Studies, n (%)<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Study metadata</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Study design</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Survey</td>
                <td colspan="2">41 (63)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Quasi-experiment</td>
                <td colspan="2">11 (17)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Randomized controlled trial</td>
                <td colspan="2">13 (20)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Type of publication</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Journal article</td>
                <td colspan="2">37 (57)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Conference proceeding</td>
                <td colspan="2">25 (39)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Thesis</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Country</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>United States</td>
                <td colspan="2">33 (51)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>France</td>
                <td colspan="2">5 (8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Netherlands</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Japan</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Australia</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Italy</td>
                <td colspan="2">2 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Switzerland and Netherlands</td>
                <td colspan="2">2 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Finland</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Sweden</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Turkey</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>United Kingdom</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Switzerland &#38; Germany</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mexico</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Spain</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Global population</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Romania, Spain and Scotland</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Philippines</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Switzerland</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>New Zealand</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Spain and New Zealand</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>South Africa</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Year of publication</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Before 2010</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>2010-2014</td>
                <td colspan="2">17 (26)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>2015-2019</td>
                <td colspan="2">45 (70)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Population</bold>
                  <bold>characteristics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Sample size<sup>b</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>≤50</td>
                <td colspan="2">38 (62)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>51-100</td>
                <td colspan="2">11 (18)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>101-200</td>
                <td colspan="2">9 (15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>&#62;200</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Age (years)<sup>c</sup></bold>
                </td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mean (range) </td>
                <td colspan="2">39 (13-79)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Sex (%)<sup>e</sup></bold>
                </td>
              </tr>
              <tr valign="bottom">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">48.1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Health condition<sup>f</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Clinical sample</td>
                <td colspan="2">34 (55)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Nonclinical sample</td>
                <td colspan="2">28 (45)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Setting<sup>g,h</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Clinical</td>
                <td colspan="2">30 (50)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Community</td>
                <td colspan="2">20 (33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Educational</td>
                <td colspan="2">18 (30)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Intervention characteristics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Purpose<sup>i</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Self-management</td>
                <td colspan="2">17 (26)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Therapy</td>
                <td colspan="2">12 (19)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Counselling</td>
                <td colspan="2">12 (19)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Education</td>
                <td colspan="2">10 (15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Screening</td>
                <td colspan="2">9 (14)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Training</td>
                <td colspan="2">7 (11)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Diagnosing</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Platform</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Stand-alone software</td>
                <td colspan="2">40 (62)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Web-based</td>
                <td colspan="2">25 (39)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Response generation</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Rule-based</td>
                <td colspan="2">53 (82)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Artificial intelligence</td>
                <td colspan="2">11 (17)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Hybrid</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Dialogue initiative</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Chatbot</td>
                <td colspan="2">58 (89)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Users</td>
                <td colspan="2">4 (6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Both</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Input modality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Text</td>
                <td colspan="2">40 (62)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Voice</td>
                <td colspan="2">9 (14)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Voice and nonverbal</td>
                <td colspan="2">8 (12)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Text and voice</td>
                <td colspan="2">6 (9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Text and nonverbal</td>
                <td colspan="2">2 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Output modality</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Text, voice and nonverbal</td>
                <td colspan="2">21 (32)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Text</td>
                <td colspan="2">20 (31)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Voice and nonverbal</td>
                <td colspan="2">19 (29)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Text &#38; voice</td>
                <td colspan="2">4 (6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Voice</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="4">
                  <bold>Targeted disorders<sup>j</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Any health condition</td>
                <td colspan="2">20 (31)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Depression</td>
                <td colspan="2">15 (23)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Autism</td>
                <td colspan="2">5 (8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Anxiety</td>
                <td colspan="2">5 (8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Substance use disorder</td>
                <td colspan="2">5 (8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Posttraumatic stress disorder</td>
                <td colspan="2">5 (8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mental disorders</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Sexually transmitted diseases</td>
                <td colspan="2">3 (5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Sleep disorders</td>
                <td colspan="2">2 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Diabetes</td>
                <td colspan="2">2 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Alzheimer</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Asthma</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Cervical cancer</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Dementia</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Schizophrenia</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Stress</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Genetic variants</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Cognitive impairment</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Atrial fibrillation</td>
                <td colspan="2">1 (2)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Percentages were rounded and may not sum to 100.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Sample size was reported in 61 studies.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>Mean age was reported in 44 studies.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>Sex was reported in 54 studies.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>Sample type was reported in 62 studies.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>Setting was reported in 61 studies.</p>
            </fn>
            <fn id="table1fn8">
              <p><sup>h</sup>Numbers do not add up as several chatbots focused on more than one health condition.</p>
            </fn>
            <fn id="table1fn9">
              <p><sup>i</sup>Numbers do not add up as several chatbots have more than one purpose.</p>
            </fn>
            <fn id="table1fn10">
              <p><sup>j</sup>Numbers do not add up as several chatbots target more than one health condition.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Results of Studies</title>
        <sec>
          <title>Overview</title>
          <p>The included studies evaluated chatbots using many technical metrics, which were categorized into 4 main groups: metrics related to chatbots as a whole (global metrics), metrics related to response generation, metrics related to response understanding, and metrics related to esthetics. More details about metrics are presented in the following sections.</p>
        </sec>
        <sec>
          <title>Global Metrics</title>
          <p>The included studies evaluated chatbots as a whole using the following metrics: usability, classifier performance, speed, technical issues, intelligence, task completion rate, dialogue efficiency, dialogue handling, context awareness, and error management.</p>
          <p>Usability of chatbots was assessed in 37 (56.9%) studies [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref53">53</xref>]. Usability was evaluated using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref47">47</xref>-<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref53">53</xref>], multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref43">43</xref>], a specific questionnaire (eg, system usability scale [SUS] questionnaire) [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref52">52</xref>], or observation [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
          <p>Classifier performance of chatbots was evaluated in 8 (12.3%) studies [<xref ref-type="bibr" rid="ref54">54</xref>-<xref ref-type="bibr" rid="ref61">61</xref>]. Many metrics were used to measure the classifier performance, namely: area under curve [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>], accuracy [<xref ref-type="bibr" rid="ref56">56</xref>-<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref61">61</xref>], sensitivity [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>], specificity [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>], positive predictive value [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref60">60</xref>], and negative predictive value [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref60">60</xref>]. The speed of chatbots was examined in 4 studies [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref62">62</xref>]. The speed was evaluated using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref35">35</xref>], multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref53">53</xref>], and interviews [<xref ref-type="bibr" rid="ref62">62</xref>].</p>
          <p>Technical issues (eg, errors/glitches) in chatbots were examined in 4 studies (6.2%) [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]. Technical issues were assessed through interviews [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref63">63</xref>], a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref36">36</xref>], and checking staff logs [<xref ref-type="bibr" rid="ref51">51</xref>]. In addition, 3 studies assessed the intelligence of chatbots using either multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref64">64</xref>] or a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref27">27</xref>]. In 3 studies, the task completion rate was examined by checking the conversation logs [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref65">65</xref>].</p>
          <p>Of the reviewed studies, 2 (3.1%) studies examined chatbot flexibility in dialogue handling (eg, its ability to maintain a conversation and deal with users’ generic questions or responses that require more, less, or different information than was requested) using interviews [<xref ref-type="bibr" rid="ref27">27</xref>] and multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref38">38</xref>]. Dialogue efficiency of chatbots, which refers to the number of dialogue steps required to finish a task, was assessed in 1 study by reviewing transcribed conversation logs [<xref ref-type="bibr" rid="ref38">38</xref>]. The same study examined the chatbot’s context awareness (ie, its ability to utilize contextual knowledge to appropriately respond to users) using multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref38">38</xref>]. Error management, which refers to a chatbot’s ability to detect and understand misspelled words in users’ replies (eg, “anious” instead of anxious), was examined in only 1 study [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        </sec>
        <sec>
          <title>Metrics Related to Response Generation</title>
          <p>The following metrics were utilized by the included studies to evaluate response generation by chatbots: appropriateness of responses, comprehensibility, realism, speed of response, empathy, repetitiveness, clarity of speech, and linguistic accuracy.</p>
          <p>Of the reviewed studies, 15 (23.1%) examined the appropriateness and adequacy of verbal [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref69">69</xref>] and nonverbal responses of chatbots [<xref ref-type="bibr" rid="ref32">32</xref>]. Appropriateness of responses was assessed using interviews [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref68">68</xref>], a single question in self-administrated questionnaire [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref67">67</xref>], conversation logs [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref69">69</xref>], and multiple questions in self-administrated questionnaire [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
          <p>Comprehensibility of responses, which refers to the degree to which a chatbot generates responses understandable by users, was evaluated by 14 (21.5%) studies [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref69">69</xref>]. Comprehensibility of responses was evaluated using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref69">69</xref>] and interviews [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref51">51</xref>].</p>
          <p>In total, 14 (21.5%) studies assessed how human-like chatbots are (realism) [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref70">70</xref>-<xref ref-type="bibr" rid="ref72">72</xref>]. Realism of chatbots was examined in terms of verbal responses only [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref70">70</xref>], nonverbal responses only [<xref ref-type="bibr" rid="ref66">66</xref>], or both verbal and nonverbal responses [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref72">72</xref>]. The included studies evaluated realism using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref70">70</xref>], multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref72">72</xref>], and interviews [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref71">71</xref>].</p>
          <p>Altogether, 11 (16.9%) studies assessed the speed of a chatbot’s responses [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref68">68</xref>-<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref73">73</xref>]. The speed of responses was examined using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref73">73</xref>], interviews [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref68">68</xref>], multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref53">53</xref>], and system logs [<xref ref-type="bibr" rid="ref38">38</xref>]. Empathy of a chatbot, which refers to its ability to show empathy to users, was examined in 10 studies [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref74">74</xref>]. Those studies evaluated empathy using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref73">73</xref>], interviews [<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref71">71</xref>], and multiple questions in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref64">64</xref>].</p>
          <p>Repetitiveness of a chatbot’s responses was examined in 9 (13.8%) studies [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]. Repetitiveness of responses was evaluated using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref73">73</xref>] and interviews [<xref ref-type="bibr" rid="ref66">66</xref>,<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]. We found that 6 (9.2%) studies evaluated clarity or quality of speech using either interviews [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref75">75</xref>] or a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref77">77</xref>]. Linguistic accuracy of a chatbot’s responses was evaluated in 2 (3.7%) studies using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        </sec>
        <sec>
          <title>Metrics Related to Response Understanding</title>
          <p>The included studies evaluated chatbot understanding of users’ responses using the following metrics: understanding as assessed by users, word error rate, concept error rate, and attention estimator errors.</p>
          <p>Chatbot understanding, which refers to a chatbot’s ability to adequately understand the verbal and nonverbal responses of users, was assessed by 20 (30.8%) studies [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref79">79</xref>]. Of those studies, 2 studies assessed understanding of both verbal and nonverbal responses [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref79">79</xref>], 1 study assessed understanding of nonverbal responses only [<xref ref-type="bibr" rid="ref32">32</xref>], and the remaining studies assessed understanding of verbal responses only. The understanding of responses was evaluated using multiple questions in a self-administrated questionnaire in 4 studies [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref79">79</xref>], interviews in 2 studies [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref68">68</xref>], and a single question in a self-administrated questionnaire in the remaining studies.</p>
          <p>Word error rate, which assesses the performance of speech recognition in chatbots, was examined in 2 (3.7%) studies using conversational logs [<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref69">69</xref>]. Concept error rate, which depends on the correct recognition of the semantic result of a user utterance, was evaluated in 1 study by checking conversational logs [<xref ref-type="bibr" rid="ref65">65</xref>]. Attention estimation, which refers to a chatbot’s ability to determine whether the user is gazing toward the screen or away from it, was examined in 1 study by checking conversational logs [<xref ref-type="bibr" rid="ref69">69</xref>].</p>
        </sec>
        <sec>
          <title>Metrics Related to Esthetics</title>
          <p>The included studies evaluated the esthetics of chatbots using the following metrics: appearance of the virtual agent, background color and content, font type and size, button color, shape, icon, and background color contrast.</p>
          <p>In total, 5 (7.7%) studies assessed the appearance of the virtual agent using a single question in a self-administrated questionnaire [<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref80">80</xref>], interviews [<xref ref-type="bibr" rid="ref51">51</xref>], and focus groups [<xref ref-type="bibr" rid="ref45">45</xref>]. In addition, 1 (1.5%) study evaluated background color, color contrast, and content; font type and size; and button color, shape, and icon using a survey [<xref ref-type="bibr" rid="ref80">80</xref>].</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>It became clear that there is currently no standard method in use to evaluate health chatbots. Most aspects are studied using self-administered questionnaires or user interviews. Common metrics are response speed, word error rate, concept error rate, dialogue efficiency, attention estimation, and task completion. Various studies assessed different aspects of chatbots, complicating direct comparison. Although some of this variation may be due to the individual characteristics of chatbot implementations and their distinct use cases, it is difficult to see why metrics such as appropriateness of responses, comprehensibility, realism, speed of response, empathy and repetitiveness are each only applicable to a small percentage of cases. Further, objective quantitative metrics (eg, those based on log reviews) were comparatively rarely used in the reported studies. We thus suggest continuing research and development toward an evaluation framework for technical metrics with recommendations for specific circumstances for their inclusion in chatbot studies.</p>
        <p>Jadeja et al [<xref ref-type="bibr" rid="ref81">81</xref>] introduced 4 dimensions for chatbot evaluations: the information retrieval (IR) perspective, the user experience (UX) perspective, the linguistic perspective, and the AI (human-likeness) perspective. In earlier work [<xref ref-type="bibr" rid="ref14">14</xref>], we adapted and broadened this categorization, modifying the IR perspective to a task-oriented perspective since health chatbots are not necessarily designed only to retrieve information; additionally, we included system quality and health care quality perspectives. Excluding the health care quality perspective, which is outside the definition of technical metrics, the findings of this scoping review show that all these dimensions are indeed represented in health chatbot evaluations. Rather, the issue appears to be the inconsistency in what is measured and how, along with the skew toward self-reporting and the UX perspective. Additional work is still required to come up with standard metrics and corresponding assessment tools specifically addressing quality in health chatbots.</p>
        <p>We found usability to be the most commonly assessed aspect of health chatbots. The system usability scale (SUS [<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref83">83</xref>]) is a well-established usability instrument that we observed was used repeatedly, although it was not used in the majority of the studies assessing usability; in many cases, a single survey question was used instead. The SUS is nonproprietary, technology-agnostic, and designed to support comparison across products [<xref ref-type="bibr" rid="ref82">82</xref>]. As such, global assessment of the user experience of health chatbots could be enhanced in quality and comparability by researchers standardizing on inclusion of the SUS in their evaluations. However, studies by Holmes et al [<xref ref-type="bibr" rid="ref84">84</xref>] showed that conventional methods for assessing usability and user experience may not be as accurate when applied to health chatbots. As such, there remains research to be done toward appropriate metrics for health chatbots.</p>
        <p>Conversational-turns per session (CPS) has been suggested as a success metric for social chatbots as exemplified by XiaoIce [<xref ref-type="bibr" rid="ref85">85</xref>]. Although the aims for health chatbots are not identical to those of social chatbots, if CPS gains acceptance as a standard measure in the social chatbot domain, it would make it a leading candidate for a standard measure to include in health chatbot evaluations to assess their social engagement dimension. An alternative or supplementary measure related to the social dimension would be to have users score the chatbot on empathy; however, CPS has the advantage of being an objective and quantitative measure. Other objective and quantitative measures such as interaction time or time on task could be alternatives to CPS, but might be less representative of engagement than CPS if for instance the user was multitasking chatbot interaction with other tasks. Beyond social engagement, task completion (often assessed by analyzing conversation logs) is another promising global measure.</p>
        <p>A further area for standardization would be in the quality of responses. We observed response generation to be widely measured but in very diverse ways. Emergence of standard measures for response generation and understanding would greatly advance the comparability of studies. Development of validated instruments in this area would be a useful contribution to chatbot research.</p>
        <p>We commend the inclusion of classifier performance in health chatbot studies where this is applicable and practical to assess. It could be less meaningful to compare raw performance (eg, as area under the curve) across domains due to differences in difficulty; ideally, chatbot performance would be compared to the performance of a human expert for the task at hand. Further, we perceive the opportunity for a progression of performance measures in health chatbot studies as a given product gains maturity. Good early-stage metrics would be those that assess response quality and response understanding to establish that the product is working well. Subsequent experiments can advance the assessment of self-reported usability and metrics of social engagement. Where applicable, classifier performance can round out technical performance evaluation to establish whether trials to assess clinical outcomes are warranted.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <sec>
          <title>Strengths</title>
          <p>This study is the first review that summaries the technical metrics used by previous studies to evaluate health care chatbots. This helps readers explore how chatbots were evaluated in health care. Given that this review was executed and reported in line with PRISMA-ScR guidelines [<xref ref-type="bibr" rid="ref1">1</xref>], it could be considered a high-quality review.</p>
          <p>To retrieve as many relevant studies as possible, the most commonly used databases in the fields of health and information technology were searched. Further, we searched Google Scholar and conducted backward and forward reference list checking to retrieve gray literature and minimize the risk of publication bias.</p>
          <p>As two reviewers independently selected the studies and extracted the data, the selection bias in this review was minimal. This review can be considered a comprehensive review given that we did not apply restrictions regarding the study design, study setting, year of publication, and country of publication.</p>
          <p>Laranjo et al [<xref ref-type="bibr" rid="ref86">86</xref>] reviewed the characteristics, current applications and evaluation measures of health chatbots. In contrast to our work, they did not solely concentrate on the technical metrics used for chatbot evaluations. The metrics they reviewed included task completion or word accuracy. In contrast to Laranjo et al [<xref ref-type="bibr" rid="ref86">86</xref>], who included only 17 papers reporting on 14 different conversational agents, our work is more comprehensive as it included 65 publications. Further, we had a different research question in mind while conducting the review.</p>
        </sec>
        <sec>
          <title>Limitations</title>
          <p>This review focused on chatbots that are aimed at delivering health care services to patients and work on stand-alone software and web browsers; it excluded chatbots that used robotics, serious games, SMS text messaging, Wizard-of-Oz, and telephones. Thus, this review did not include many technical metrics used to evaluate chatbots for other users (eg, physicians, nurses, and caregivers), in other fields (eg, business and education), or with alternative modes of delivery (eg, SMS text messaging, Wizard-of-Oz, and telephones). The abovementioned restrictions were applied by previous reviews about chatbots as these features are not part of ordinary chatbots [<xref ref-type="bibr" rid="ref87">87</xref>-<xref ref-type="bibr" rid="ref90">90</xref>].</p>
          <p>Due to practical constraints, we could not search interdisciplinary databases (eg, Web of Science and ProQuest), conduct a manual search, or contact experts. Further, the search in this review was restricted to English-language studies. Accordingly, it is likely that this review missed some studies.</p>
        </sec>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>From this review, we perceive the need for health chatbot evaluators to consider measurements across a range of aspects in any given study or study series, including usability, social experience, response quality, and, where applicable, classifier performance. The establishment of standard measures would greatly enhance comparability across studies with the SUS and CPS as leading candidates for usability and social experience, respectively. It would be ideal to develop guidelines for health chatbot evaluators indicating what should be measured and at what stages in product development. Development of validated measurement instruments in this domain is sparse and such instruments would benefit the field, especially for response quality metrics.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Search string.</p>
        <media xlink:href="jmir_v22i6e18301_app1.docx" xlink:title="DOCX File , 19 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Data extraction form.</p>
        <media xlink:href="jmir_v22i6e18301_app2.docx" xlink:title="DOCX File , 17 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Metadata and population characteristics of each included study.</p>
        <media xlink:href="jmir_v22i6e18301_app3.docx" xlink:title="DOCX File , 24 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Characteristics of the intervention in each included study.</p>
        <media xlink:href="jmir_v22i6e18301_app4.docx" xlink:title="DOCX File , 23 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACM</term>
          <def>
            <p>Association for Computing Machinery</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CINAHL</term>
          <def>
            <p>Cumulative Index of Nursing and Allied Health Literature</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CPS</term>
          <def>
            <p>conversational-turns per session</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">eHealth</term>
          <def>
            <p>electronic health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">EMBASE</term>
          <def>
            <p>Excerpta Medica Database</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">IEEE</term>
          <def>
            <p>Institute of Electrical and Electronics Engineers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">IR</term>
          <def>
            <p>information retrieval</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">PRISMA-ScR</term>
          <def>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses-Extension for Scoping Reviews</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">UX</term>
          <def>
            <p>user experience</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="con">
        <p>AA developed the protocol and conducted the search with guidance from and under the supervision of KD and MH. Study selection and data extraction were carried out independently by MA and ZS. AA solved any disagreements between the two reviewers. AA synthesized the data. AA and KD drafted the manuscript, and it was revised critically for important intellectual content by all authors. KD and JW reviewed the related literature and interpreted the results. All authors approved the manuscript for publication and agree to be accountable for all aspects of the work.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weizenbaum</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>ELIZA-a computer program for the study of natural language communication between man and machine</article-title>
          <source>Commun ACM</source>
          <year>1966</year>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>36</fpage>
          <lpage>45</lpage>
          <pub-id pub-id-type="doi">10.1145/365153.365168</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Automated Telephone Conversations to Assess Health Behavior and Deliver Behavioral Interventions</article-title>
          <source>Journal of Medical Systems</source>
          <year>1998</year>
          <month>04</month>
          <day>01</day>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>95</fpage>
          <lpage>102</lpage>
          <pub-id pub-id-type="doi">10.1023/A:1022695119046</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Whittaker</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>McRobbie</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bullen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rodgers</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Mobile phone-based interventions for smoking cessation</article-title>
          <source>Cochrane Database Syst Rev</source>
          <year>2016</year>
          <volume>4</volume>
          <fpage>CD006611</fpage>
          <pub-id pub-id-type="doi">10.1002/14651858.CD006611.pub4</pub-id>
          <pub-id pub-id-type="medline">27060875</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neve</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Morgan</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>CE</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness of web-based interventions in achieving weight loss and weight loss maintenance in overweight and obese adults: a systematic review with meta-analysis</article-title>
          <source>Obes Rev</source>
          <year>2010</year>
          <month>04</month>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>306</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1467-789X.2009.00646.x</pub-id>
          <pub-id pub-id-type="medline">19754633</pub-id>
          <pub-id pub-id-type="pii">OBR646</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Webb</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Joseph</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yardley</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Michie</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Using the internet to promote health behavior change: a systematic review and meta-analysis of the impact of theoretical basis, use of behavior change techniques, and mode of delivery on efficacy</article-title>
          <source>J Med Internet Res</source>
          <year>2010</year>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>e4</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2010/1/e4/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.1376</pub-id>
          <pub-id pub-id-type="medline">20164043</pub-id>
          <pub-id pub-id-type="pii">v12i1e4</pub-id>
          <pub-id pub-id-type="pmcid">PMC2836773</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kelders</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Kok</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Ossebaard</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Van Gemert-Pijnen</surname>
              <given-names>JEWC</given-names>
            </name>
          </person-group>
          <article-title>Persuasive system design does matter: a systematic review of adherence to web-based interventions</article-title>
          <source>J Med Internet Res</source>
          <year>2012</year>
          <month>11</month>
          <day>14</day>
          <volume>14</volume>
          <issue>6</issue>
          <fpage>e152</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2012/6/e152/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.2104</pub-id>
          <pub-id pub-id-type="medline">23151820</pub-id>
          <pub-id pub-id-type="pii">v14i6e152</pub-id>
          <pub-id pub-id-type="pmcid">PMC3510730</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fitzpatrick</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Darcy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vierhile</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Delivering Cognitive Behavior Therapy to Young Adults With Symptoms of Depression and Anxiety Using a Fully Automated Conversational Agent (Woebot): A Randomized Controlled Trial</article-title>
          <source>JMIR Ment Health</source>
          <year>2017</year>
          <month>06</month>
          <day>06</day>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>e19</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://mental.jmir.org/2017/2/e19/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.7785</pub-id>
          <pub-id pub-id-type="medline">28588005</pub-id>
          <pub-id pub-id-type="pii">v4i2e19</pub-id>
          <pub-id pub-id-type="pmcid">PMC5478797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gulshan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Coram</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stumpe</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Narayanaswamy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Venugopalan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Widner</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Madams</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cuadros</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Raman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Mega</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Development and Validation of a Deep Learning Algorithm for Detection of Diabetic Retinopathy in Retinal Fundus Photographs</article-title>
          <source>JAMA</source>
          <year>2016</year>
          <month>12</month>
          <day>13</day>
          <volume>316</volume>
          <issue>22</issue>
          <fpage>2402</fpage>
          <lpage>2410</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2016.17216</pub-id>
          <pub-id pub-id-type="medline">27898976</pub-id>
          <pub-id pub-id-type="pii">2588763</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stead</surname>
              <given-names>WW</given-names>
            </name>
          </person-group>
          <article-title>Clinical Implications and Challenges of Artificial Intelligence and Deep Learning</article-title>
          <source>JAMA</source>
          <year>2018</year>
          <month>09</month>
          <day>18</day>
          <volume>320</volume>
          <issue>11</issue>
          <fpage>1107</fpage>
          <lpage>1108</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2018.11029</pub-id>
          <pub-id pub-id-type="medline">30178025</pub-id>
          <pub-id pub-id-type="pii">2701665</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shum</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The Design and Implementation of XiaoIce, an Empathetic Social Chatbot</article-title>
          <source>Computational Linguistics</source>
          <year>2020</year>
          <month>03</month>
          <volume>46</volume>
          <issue>1</issue>
          <fpage>53</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1162/coli_a_00368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kroenke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>The PHQ-9: validity of a brief depression severity measure</article-title>
          <source>J Gen Intern Med</source>
          <year>2001</year>
          <month>09</month>
          <volume>16</volume>
          <issue>9</issue>
          <fpage>606</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/11556941"/>
          </comment>
          <pub-id pub-id-type="medline">11556941</pub-id>
          <pub-id pub-id-type="pii">jgi01114</pub-id>
          <pub-id pub-id-type="pmcid">PMC1495268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conlin</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Colburn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Aron</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pries</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Tschanz</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Pogach</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Synopsis of the 2017 U.S. Department of Veterans Affairs/U.S. Department of Defense Clinical Practice Guideline: Management of Type 2 Diabetes Mellitus</article-title>
          <source>Ann Intern Med</source>
          <year>2017</year>
          <month>11</month>
          <day>07</day>
          <volume>167</volume>
          <issue>9</issue>
          <fpage>655</fpage>
          <lpage>663</lpage>
          <pub-id pub-id-type="doi">10.7326/M17-1362</pub-id>
          <pub-id pub-id-type="medline">29059687</pub-id>
          <pub-id pub-id-type="pii">2659342</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kocaballi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Quiroz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rezazadegan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Berkovsky</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Magrabi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Coiera</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Responses of Conversational Agents to Health and Lifestyle Prompts: Investigation of Appropriateness and Presentation Structures</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>e15823</fpage>
          <pub-id pub-id-type="doi">10.2196/preprints.15823</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Denecke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Warren</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>How to Evaluate Health Applications with Conversational User Interface?</article-title>
          <source>Studies in Health Technology and Informatics</source>
          <year>2020</year>
          <fpage>1</fpage>
          <lpage>9</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Lillie</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zarin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Colquhoun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Levac</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Horsley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weeks</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hempel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>McGowan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hartling</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aldcroft</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Garritty</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lewin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Godfrey</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Macdonald</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Langlois</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Soares-Weiser</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moriarty</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tunçalp</surname>
              <given-names>Ö</given-names>
            </name>
            <name name-style="western">
              <surname>Straus</surname>
              <given-names>SE</given-names>
            </name>
          </person-group>
          <article-title>PRISMA Extension for Scoping Reviews (PRISMA-ScR): Checklist and Explanation</article-title>
          <source>Ann Intern Med</source>
          <year>2018</year>
          <month>10</month>
          <day>02</day>
          <volume>169</volume>
          <issue>7</issue>
          <fpage>467</fpage>
          <lpage>473</lpage>
          <pub-id pub-id-type="doi">10.7326/M18-0850</pub-id>
          <pub-id pub-id-type="medline">30178033</pub-id>
          <pub-id pub-id-type="pii">2700389</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>Practical statistics for medical research</source>
          <year>1990</year>
          <publisher-loc>London</publisher-loc>
          <publisher-name>Chapman &#38; Hall/CRC</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdullah</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Gaehde</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A Tablet Based Embodied Conversational Agent to Promote Smoking Cessation among Veterans: A Feasibility Study</article-title>
          <source>J Epidemiol Glob Health</source>
          <year>2018</year>
          <month>12</month>
          <volume>8</volume>
          <issue>3-4</issue>
          <fpage>225</fpage>
          <lpage>230</lpage>
          <pub-id pub-id-type="doi">10.2991/j.jegh.2018.08.104</pub-id>
          <pub-id pub-id-type="medline">30864768</pub-id>
          <pub-id pub-id-type="pii">j8/3-4/225</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rasazi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Mamun</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Langevin</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rawassizadeh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schubert</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A Virtual Conversational Agent for Teens with Autism: Experimental Results and Design Lessons</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <fpage>1</fpage>
          <lpage>13</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beiley</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Mental Health And Wellness Chatbot</source>
          <year>2019</year>
          <publisher-loc>United States</publisher-loc>
          <publisher-name>The University of Arizona</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Caruso</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Clough-Gorr</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Acceptance and usability of a relational agent interface by urban older adults</article-title>
          <source>CHI'05 extended abstracts on Human factors in computing systems: ACM</source>
          <year>2005</year>
          <conf-name>CHI EA '05</conf-name>
          <conf-date>April</conf-date>
          <conf-loc>Portland, OR, USA</conf-loc>
          <fpage>1212</fpage>
          <lpage>1215</lpage>
          <pub-id pub-id-type="doi">10.1145/1056808.1056879</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeifer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jack</surname>
              <given-names>BW</given-names>
            </name>
          </person-group>
          <article-title>Taking the time to care</article-title>
          <year>2009</year>
          <conf-name>Proceedings of the 27th international conference on Human factors in computing systems - CHI 09</conf-name>
          <conf-date>2009</conf-date>
          <conf-loc>Boston</conf-loc>
          <pub-id pub-id-type="doi">10.1145/1518701.1518891</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Jack</surname>
              <given-names>BW</given-names>
            </name>
            <name name-style="western">
              <surname>Paasche-Orlow</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeifer</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Odonnell</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Response to a Relational Agent by Hospital Patients with Depressive Symptoms</article-title>
          <source>Interact Comput</source>
          <year>2010</year>
          <month>07</month>
          <day>01</day>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>289</fpage>
          <lpage>298</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20628581"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.intcom.2009.12.001</pub-id>
          <pub-id pub-id-type="medline">20628581</pub-id>
          <pub-id pub-id-type="pmcid">PMC2901553</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeifer</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Byron</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Forsythe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Henault</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Jack</surname>
              <given-names>BW</given-names>
            </name>
            <name name-style="western">
              <surname>Silliman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Paasche-Orlow</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Usability of conversational agents by patients with inadequate health literacy: evidence from two clinical trials</article-title>
          <source>J Health Commun</source>
          <year>2010</year>
          <volume>15 Suppl 2</volume>
          <fpage>197</fpage>
          <lpage>210</lpage>
          <pub-id pub-id-type="doi">10.1080/10810730.2010.499991</pub-id>
          <pub-id pub-id-type="medline">20845204</pub-id>
          <pub-id pub-id-type="pii">926954323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Puskar</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Schlenk</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeifer</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Sereika</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Maintaining reality: Relational agents for antipsychotic medication adherence</article-title>
          <source>Interacting with Computers</source>
          <year>2010</year>
          <month>7</month>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>276</fpage>
          <lpage>288</lpage>
          <pub-id pub-id-type="doi">10.1016/j.intcom.2010.02.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sidner</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Automated interventions for multiple health behaviors using conversational agents</article-title>
          <source>Patient Educ Couns</source>
          <year>2013</year>
          <month>08</month>
          <volume>92</volume>
          <issue>2</issue>
          <fpage>142</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23763983"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2013.05.011</pub-id>
          <pub-id pub-id-type="medline">23763983</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(13)00211-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC3727973</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bresó</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez-Miranda</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Botella</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Baños</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Usability and acceptability assessment of an empathic virtual agent to prevent major depression</article-title>
          <source>Expert Systems</source>
          <year>2016</year>
          <month>05</month>
          <day>25</day>
          <volume>33</volume>
          <issue>4</issue>
          <fpage>297</fpage>
          <lpage>312</lpage>
          <pub-id pub-id-type="doi">10.1111/EXSY.12151</pub-id>
          <pub-id pub-id-type="medline">2016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cameron</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cameron</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Megaw</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bond</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mulvenna</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>O'Neill</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Assessing the Usability of a Chatbot for Mental Health Care</article-title>
          <source>Internet Science</source>
          <year>2019</year>
          <volume>Cham</volume>
          <fpage>121</fpage>
          <lpage>132</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-17705-8_11</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Comendador</surname>
              <given-names>BEV</given-names>
            </name>
            <name name-style="western">
              <surname>Francisco</surname>
              <given-names>BMB</given-names>
            </name>
            <name name-style="western">
              <surname>Medenilla</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Nacion</surname>
              <given-names>SMT</given-names>
            </name>
            <name name-style="western">
              <surname>Serac</surname>
              <given-names>TBE</given-names>
            </name>
          </person-group>
          <article-title>Pharmabot: A Pediatric Generic Medicine Consultant Chatbot</article-title>
          <source>JOACE</source>
          <year>2015</year>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>137</fpage>
          <lpage>140</lpage>
          <pub-id pub-id-type="doi">10.12720/joace.3.2.137-140</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crutzen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>GY</given-names>
            </name>
            <name name-style="western">
              <surname>Portugal</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Fisser</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Grolleman</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>An artificially intelligent chat agent that answers adolescents' questions related to sex, drugs, and alcohol: an exploratory study</article-title>
          <source>J Adolesc Health</source>
          <year>2011</year>
          <month>05</month>
          <volume>48</volume>
          <issue>5</issue>
          <fpage>514</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jadohealth.2010.09.002</pub-id>
          <pub-id pub-id-type="medline">21501812</pub-id>
          <pub-id pub-id-type="pii">S1054-139X(10)00430-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Demirci</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <source>User experience over time with conversational agents case study of woebot on supporting subjective well-being</source>
          <year>2018</year>
          <publisher-loc>Turkey</publisher-loc>
          <publisher-name>Middle East Technical University</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Denecke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hochreutener</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pöpel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>May</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Self-Anamnesis with a Conversational User Interface: Concept and Usability Study</article-title>
          <source>Methods Inf Med</source>
          <year>2019</year>
          <month>03</month>
          <day>15</day>
          <volume>57</volume>
          <issue>05/06</issue>
          <fpage>243</fpage>
          <lpage>252</lpage>
          <pub-id pub-id-type="doi">10.1055/s-0038-1675822</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>DeVault</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Artstein</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Benn</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fast</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Georgila</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gratch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hartholt</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lhommet</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lucas</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Marsella</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Morbini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Nazarian</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Scherer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stratou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Suri</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Traum</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rizzo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Morency</surname>
              <given-names>LP</given-names>
            </name>
          </person-group>
          <article-title>SimSensei kiosk: a virtual human interviewer for healthcare decision support</article-title>
          <year>2014</year>
          <conf-name>International Foundation for Autonomous Agents and Multiagent Systems</conf-name>
          <conf-date>May 2014</conf-date>
          <conf-loc>Paris</conf-loc>
          <fpage>1061</fpage>
          <lpage>1068</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dworkin</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Monahan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hightow-Weidman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Garofalo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Qato</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jimenez</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Acceptability, Feasibility, and Preliminary Efficacy of a Theory-Based Relational Embodied Conversational Agent Mobile Phone Intervention to Promote HIV Medication Adherence in Young HIV-Positive African American MSM</article-title>
          <source>AIDS Educ Prev</source>
          <year>2019</year>
          <month>02</month>
          <volume>31</volume>
          <issue>1</issue>
          <fpage>17</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1521/aeap.2019.31.1.17</pub-id>
          <pub-id pub-id-type="medline">30742481</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elmasri</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Maeder</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A Conversational Agent for an Online Mental Health Intervention</article-title>
          <source>Brain Informatics and Health: International Conference</source>
          <year>2016</year>
          <conf-name>Brain Informatics and Health 2016</conf-name>
          <conf-date>October 13-16</conf-date>
          <conf-loc>Omaha, NE, USA</conf-loc>
          <fpage>243</fpage>
          <lpage>251</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-47103-7_24</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fadhil</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schiavo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Villafiorita</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fondazione</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>OlloBot-Towards A Text-Based Arabic Health Conversational Agentvaluation and Results</article-title>
          <year>2019</year>
          <conf-name>Proceedings of Recent Advances in Natural Language Processing</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Varna</conf-loc>
          <fpage>295</fpage>
          <lpage>303</lpage>
          <pub-id pub-id-type="doi">10.26615/978-954-452-056-4_034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Griol</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Callejas</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Mobile Conversational Agents for Context-Aware Care Applications</article-title>
          <source>Cogn Comput</source>
          <year>2015</year>
          <month>8</month>
          <day>21</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>336</fpage>
          <lpage>356</lpage>
          <pub-id pub-id-type="doi">10.1007/s12559-015-9352-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hanke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sandner</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kadyrov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Stainer-Hochgatterer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Daily life support at home through a virtual support partner</article-title>
          <year>2016</year>
          <conf-name>2nd IET International Conference on Technologies for Active and Assisted Living (TechAAL)</conf-name>
          <conf-date>2016</conf-date>
          <conf-loc>London</conf-loc>
          <fpage>1</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1049/ic.2016.0058</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hess</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fricker</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Denecke</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Improving and Evaluating eMMA?s Communication Skills: A Chatbot for Managing Medication</article-title>
          <source>Studies in health technology and informatics</source>
          <year>2019</year>
          <volume>259</volume>
          <fpage>101</fpage>
          <lpage>104</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kadariya</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Venkataramanan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yip</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Thirunarayanan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sheth</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>kBot: Knowledge-Enabled Personalized Chatbot for Asthma Self-Management</article-title>
          <year>2019</year>
          <conf-name>IEEE International Conference on Smart Computing (SMARTCOMP)</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Washington</conf-loc>
          <fpage>138</fpage>
          <lpage>143</lpage>
          <pub-id pub-id-type="doi">10.1109/smartcomp.2019.00043</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kowatsch</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Otto</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Harperink</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cotti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schlieter</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A design and evaluation framework for digital health interventions</article-title>
          <source>IT - Information Technology</source>
          <year>2019</year>
          <volume>61</volume>
          <issue>5-6</issue>
          <fpage>253</fpage>
          <lpage>263</lpage>
          <pub-id pub-id-type="doi">10.1515/itit-2019-0019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lisetti</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Amini</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yasavur</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Rishe</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>I Can Help You Change! An Empathic Virtual Agent Delivers Behavior Change Health Interventions</article-title>
          <source>ACM Trans Manage Inf Syst</source>
          <year>2013</year>
          <month>12</month>
          <day>01</day>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>1</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1145/2544103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magnani</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Schlusser</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Kimani</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rollman</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Paasche-Orlow</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
          </person-group>
          <article-title>The Atrial Fibrillation Health Literacy Information Technology System: Pilot Assessment</article-title>
          <source>JMIR Cardio</source>
          <year>2017</year>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>e7</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29473644"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/cardio.8543</pub-id>
          <pub-id pub-id-type="medline">29473644</pub-id>
          <pub-id pub-id-type="pmcid">PMC5818980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Micoulaud-Franchi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sagaspe</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>de</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Bioulac</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sauteraud</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Philip</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Acceptability of Embodied Conversational Agent in a Health Care Context</article-title>
          <source>Intelligent Virtual Agents</source>
          <year>2016</year>
          <fpage>416</fpage>
          <lpage>419</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-47665-0_45</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Milne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Luerssen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Leibbrandt</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Powers</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Development of a virtual agent based social tutor for children with autism spectrum disorders. The 2010 International Joint Conference on Neural Networks (IJCNN)</article-title>
          <year>2010</year>
          <conf-name>The 2010 International Joint Conference on Neural Networks (IJCNN)</conf-name>
          <conf-date>2010  July 2010</conf-date>
          <conf-loc>Barcelona</conf-loc>
          <fpage>18</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1109/ijcnn.2010.5596584</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schmidlen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>DiLoreto</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kirchner</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Sturm</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Patient assessment of chatbots for the scalable delivery of genetic counseling</article-title>
          <source>J Genet Couns</source>
          <year>2019</year>
          <month>12</month>
          <volume>28</volume>
          <issue>6</issue>
          <fpage>1166</fpage>
          <lpage>1177</lpage>
          <pub-id pub-id-type="doi">10.1002/jgc4.1169</pub-id>
          <pub-id pub-id-type="medline">31549758</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schroeder</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilkes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rowan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toledo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Paradiso</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Czerwinski</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Pocket Skills: A Conversational Mobile Web App To Support Dialectical Behavioral Therapy</article-title>
          <year>2018</year>
          <conf-name>The 2018 CHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>2018</conf-date>
          <conf-loc>Montreal</conf-loc>
          <publisher-loc>Canada</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1145/3173574.3173972</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ginger</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Boteler Humm</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Olsen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Fleming</surname>
              <given-names>MF</given-names>
            </name>
          </person-group>
          <article-title>Virtual reality job interview training for individuals with psychiatric disabilities</article-title>
          <source>J Nerv Ment Dis</source>
          <year>2014</year>
          <month>09</month>
          <volume>202</volume>
          <issue>9</issue>
          <fpage>659</fpage>
          <lpage>67</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25099298"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/NMD.0000000000000187</pub-id>
          <pub-id pub-id-type="medline">25099298</pub-id>
          <pub-id pub-id-type="pmcid">PMC4149584</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ginger</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Humm</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Olsen</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Fleming</surname>
              <given-names>MF</given-names>
            </name>
          </person-group>
          <article-title>Virtual reality job interview training in adults with autism spectrum disorder</article-title>
          <source>J Autism Dev Disord</source>
          <year>2014</year>
          <month>10</month>
          <volume>44</volume>
          <issue>10</issue>
          <fpage>2450</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24803366"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10803-014-2113-y</pub-id>
          <pub-id pub-id-type="medline">24803366</pub-id>
          <pub-id pub-id-type="pmcid">PMC4167908</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Humm</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Fleming</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Ginger</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Olsen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <article-title>Virtual Reality Job Interview Training for Veterans with Posttraumatic Stress Disorder</article-title>
          <source>J Vocat Rehabil</source>
          <year>2015</year>
          <volume>42</volume>
          <issue>3</issue>
          <fpage>271</fpage>
          <lpage>279</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27721645"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/JVR-150748</pub-id>
          <pub-id pub-id-type="medline">27721645</pub-id>
          <pub-id pub-id-type="pmcid">PMC5051574</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sakti</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Neubig</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Toda</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Negoro</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Iwasaka</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Automated Social Skills Trainer</article-title>
          <year>2015</year>
          <conf-name>The 20th International Conference on Intelligent User Interfaces</conf-name>
          <conf-date>2015</conf-date>
          <conf-loc>Atlanta</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2678025.2701368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Callender</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gonynor</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cullen</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Redondo</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>BJ</given-names>
            </name>
          </person-group>
          <article-title>Using Relational Agents to Promote Family Communication Around Type 1 Diabetes Self-Management in the Diabetes Family Teamwork Online Intervention: Longitudinal Pilot Study</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>09</month>
          <day>13</day>
          <volume>21</volume>
          <issue>9</issue>
          <fpage>e15318</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/9/e15318/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/15318</pub-id>
          <pub-id pub-id-type="medline">31538940</pub-id>
          <pub-id pub-id-type="pii">v21i9e15318</pub-id>
          <pub-id pub-id-type="pmcid">PMC6754689</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tielman</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Neerincx</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Bidarra</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kybartas</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkman</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A Therapy System for Post-Traumatic Stress Disorder Using a Virtual Agent and Virtual Storytelling to Reconstruct Traumatic Memories</article-title>
          <source>J Med Syst</source>
          <year>2017</year>
          <month>08</month>
          <volume>41</volume>
          <issue>8</issue>
          <fpage>125</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28699083"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10916-017-0771-y</pub-id>
          <pub-id pub-id-type="medline">28699083</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-017-0771-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC5506234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yasavur</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Lisetti</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rishe</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Let’s talk! speaking virtual counselor offers you a brief intervention</article-title>
          <source>J Multimodal User Interfaces</source>
          <year>2014</year>
          <month>9</month>
          <day>5</day>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>381</fpage>
          <lpage>398</lpage>
          <pub-id pub-id-type="doi">10.1007/s12193-014-0169-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Amato</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Marrone</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moscato</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Piantadosi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Picariello</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sansone</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Chatbots Meet eHealth: Automatizing Healthcare</article-title>
          <year>2017</year>
          <conf-name>Workshop on Artificial Intelligence with Application in Health</conf-name>
          <conf-date>2017</conf-date>
          <conf-loc>Bari</conf-loc>
          <fpage>1</fpage>
          <lpage>10</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Auriacombe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moriceau</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Serre</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Denis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Micoulaud-Franchi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>de Sevin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bonhomme</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bioulac</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fatseas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Philip</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of a virtual agent to screen tobacco and alcohol use disorders</article-title>
          <source>Drug and Alcohol Dependence</source>
          <year>2018</year>
          <month>12</month>
          <volume>193</volume>
          <issue>6</issue>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1016/J.drugalcdep.2018.08.025</pub-id>
          <pub-id pub-id-type="medline">2018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatia</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Quro: Facilitating User Symptom Check Using a Personalised Chatbot-Oriented Dialogue System</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2018</year>
          <volume>252</volume>
          <fpage>51</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="medline">30040682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Inkster</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sarda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Subramanian</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>An Empathy-Driven, Conversational Artificial Intelligence Agent (Wysa) for Digital Mental Well-Being: Real-World Data Evaluation Mixed-Methods Study</article-title>
          <source>JMIR mHealth uHealth</source>
          <year>2018</year>
          <month>11</month>
          <day>23</day>
          <volume>6</volume>
          <issue>11</issue>
          <fpage>e12106</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://mhealth.jmir.org/2018/11/e12106/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12106</pub-id>
          <pub-id pub-id-type="medline">30470676</pub-id>
          <pub-id pub-id-type="pii">v6i11e12106</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ni</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>MANDY: Towards a Smart Primary Care Chatbot Application</article-title>
          <source>Knowledge and Systems Sciences</source>
          <year>2017</year>
          <fpage>38</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1007/978-981-10-6989-5_4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Philip</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bioulac</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sauteraud</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaufton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Olive</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Could a Virtual Human Be Used to Explore Excessive Daytime Sleepiness in Patients?</article-title>
          <source>Presence: Teleoperators and Virtual Environments</source>
          <year>2014</year>
          <month>11</month>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>369</fpage>
          <lpage>376</lpage>
          <pub-id pub-id-type="doi">10.1162/pres_a_00197</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Philip</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Micoulaud-Franchi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sagaspe</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sevin</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Olive</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bioulac</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sauteraud</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Virtual human as a new diagnostic tool, a proof of concept study in the field of major depressive disorders</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>02</month>
          <day>16</day>
          <volume>7</volume>
          <fpage>42656</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/srep42656"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep42656</pub-id>
          <pub-id pub-id-type="medline">28205601</pub-id>
          <pub-id pub-id-type="pii">srep42656</pub-id>
          <pub-id pub-id-type="pmcid">PMC5311989</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Adachi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ukita</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ikeda</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kazui</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kudo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Detecting Dementia Through Interactive Computer Avatars</article-title>
          <source>IEEE J Transl Eng Health Med</source>
          <year>2017</year>
          <volume>5</volume>
          <fpage>1</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1109/jtehm.2017.2752152</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gardiner</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>McCue</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Negash</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>LF</given-names>
            </name>
            <name name-style="western">
              <surname>Yinusa-Nyahkoon</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jack</surname>
              <given-names>BW</given-names>
            </name>
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
          </person-group>
          <article-title>Engaging women with an embodied conversational agent to deliver mindfulness and lifestyle recommendations: A feasibility randomized control trial</article-title>
          <source>Patient Educ Couns</source>
          <year>2017</year>
          <month>09</month>
          <volume>100</volume>
          <issue>9</issue>
          <fpage>1720</fpage>
          <lpage>1729</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pec.2017.04.015</pub-id>
          <pub-id pub-id-type="medline">28495391</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(17)30249-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5559098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Razavi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schubert</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hoque</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The LISSA virtual human and ASD teens: An overview of initial experiments</article-title>
          <year>2016</year>
          <conf-name>International Conference on Intelligent Virtual Agents</conf-name>
          <conf-date>2016</conf-date>
          <conf-loc>Los Angeles</conf-loc>
          <fpage>460</fpage>
          <lpage>463</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-47665-0_55</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sundar</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Should Machines Express Sympathy and Empathy? Experiments with a Health Advice Chatbot</article-title>
          <source>Cyberpsychol Behav Soc Netw</source>
          <year>2018</year>
          <month>10</month>
          <volume>21</volume>
          <issue>10</issue>
          <fpage>625</fpage>
          <lpage>636</lpage>
          <pub-id pub-id-type="doi">10.1089/cyber.2018.0110</pub-id>
          <pub-id pub-id-type="medline">30334655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Turunen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hakulinen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ståhl</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Gambäck</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hansen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rodríguez Gancedo</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>de la Cámara</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Charlton</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cavazza</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Multimodal and mobile conversational Health and Fitness Companions</article-title>
          <source>Computer Speech &#38; Language</source>
          <year>2011</year>
          <month>4</month>
          <volume>25</volume>
          <issue>2</issue>
          <fpage>192</fpage>
          <lpage>209</lpage>
          <pub-id pub-id-type="doi">10.1016/j.csl.2010.04.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Szentagotai Tatar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McKinstry</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Matheson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Matu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moldovan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Macnab</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Farrow</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>David</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pagliari</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano Blanco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wolters</surname>
              <given-names>M</given-names>
            </name>
            <collab>Help4Mood Consortium</collab>
          </person-group>
          <article-title>Pilot randomised controlled trial of Help4Mood, an embodied virtual agent-based system to support treatment of depression</article-title>
          <source>J Telemed Telecare</source>
          <year>2016</year>
          <month>09</month>
          <volume>22</volume>
          <issue>6</issue>
          <fpage>348</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1177/1357633X15609793</pub-id>
          <pub-id pub-id-type="medline">26453910</pub-id>
          <pub-id pub-id-type="pii">1357633X15609793</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Swartout</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Artstein</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Forbell</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Foutz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lane</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Lange</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Morie</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Rizzo</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Traum</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Virtual Humans for Learning</article-title>
          <source>AIMag</source>
          <year>2013</year>
          <month>12</month>
          <day>15</day>
          <volume>34</volume>
          <issue>4</issue>
          <fpage>13</fpage>
          <pub-id pub-id-type="doi">10.1609/aimag.v34i4.2487</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Heerden</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ntinga</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Vilakazi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The potential of conversational agents to provide a rapid HIV counseling and testing services</article-title>
          <year>2017</year>
          <conf-name>International Conference on the Frontiers and Advances in Data Science</conf-name>
          <conf-date>2017</conf-date>
          <conf-loc>Xi'an</conf-loc>
          <fpage>80</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1109/fads.2017.8253198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wargnier</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Benveniste</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jouvelot</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rigaud</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Usability assessment of interaction management support in LOUISE, an ECA-based user interface for elders with cognitive impairment</article-title>
          <source>TAD</source>
          <year>2018</year>
          <month>11</month>
          <day>26</day>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>105</fpage>
          <lpage>126</lpage>
          <pub-id pub-id-type="doi">10.3233/tad-180189</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>“Give Me the Support I Want!”: The Effect of Matching an Embodied Conversational Agent’s Social Support to Users’ Social Support Needs in Fostering Positive User-Agent Interaction</article-title>
          <year>2018</year>
          <conf-name>The 6th International Conference on Human-Agent Interaction</conf-name>
          <conf-date>2018</conf-date>
          <conf-loc>Southampton</conf-loc>
          <fpage>106</fpage>
          <lpage>113</lpage>
          <pub-id pub-id-type="doi">10.1145/3284432.3284462</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olafsson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>O'Leary</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Coerced Change-talk with Conversational Agents Promotes Confidence in Behavior Change</article-title>
          <year>2019</year>
          <conf-name>The 13th EAI International Conference on Pervasive Computing Technologies for Healthcare</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Trento</conf-loc>
          <fpage>31</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1145/3329189.3329202</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tielman</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Neerincx</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>van Meggelen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Franken</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkman</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>How should a virtual agent present psychoeducation? Influence of verbal and textual presentation on adherence</article-title>
          <source>Technol Health Care</source>
          <year>2017</year>
          <month>12</month>
          <day>04</day>
          <volume>25</volume>
          <issue>6</issue>
          <fpage>1081</fpage>
          <lpage>1096</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28800346"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/THC-170899</pub-id>
          <pub-id pub-id-type="medline">28800346</pub-id>
          <pub-id pub-id-type="pii">THC170899</pub-id>
          <pub-id pub-id-type="pmcid">PMC5814660</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fulmer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Joerin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gentile</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lakerink</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rauws</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Using Psychological Artificial Intelligence (Tess) to Relieve Symptoms of Depression and Anxiety: Randomized Controlled Trial</article-title>
          <source>JMIR Ment Health</source>
          <year>2018</year>
          <month>12</month>
          <day>13</day>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>e64</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://mental.jmir.org/2018/4/e64/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.9782</pub-id>
          <pub-id pub-id-type="medline">30545815</pub-id>
          <pub-id pub-id-type="pii">v5i4e64</pub-id>
          <pub-id pub-id-type="pmcid">PMC6315222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martínez-Miranda</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bresó</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Look on the bright side: a model of cognitive change in virtual agents</article-title>
          <year>2014</year>
          <conf-name>International Conference on Intelligent Virtual Agents</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>Boston</conf-loc>
          <fpage>285</fpage>
          <lpage>294</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-09767-1_37</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <source>Relational agents affecting change through human-computer relationships</source>
          <year>2003</year>
          <publisher-loc>USA</publisher-loc>
          <publisher-name>Massachusetts Institute of Technology</publisher-name>
          <fpage>1</fpage>
          <lpage>284</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ly</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Ly</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Andersson</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A fully automated conversational agent for promoting mental well-being: A pilot RCT using mixed methods</article-title>
          <source>Internet Interventions</source>
          <year>2017</year>
          <month>12</month>
          <volume>10</volume>
          <fpage>39</fpage>
          <lpage>46</lpage>
          <pub-id pub-id-type="doi">10.1016/j.invent.2017.10.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martínez-Miranda</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ramos</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aguilar</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jiménez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Arias</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rosales</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Valencia</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Assessment of users' acceptability of a mobile-based embodied conversational agent for the prevention and detection of suicidal behaviour</article-title>
          <source>J Med Syst</source>
          <year>2019</year>
          <month>06</month>
          <day>25</day>
          <volume>43</volume>
          <issue>8</issue>
          <fpage>246</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-019-1387-1</pub-id>
          <pub-id pub-id-type="medline">31240494</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-019-1387-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pinto</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Greenblatt</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hickman</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Rice</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Clochesy</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Assessing the Critical Parameters of eSMART-MH: A Promising Avatar-Based Digital Therapeutic Intervention to Reduce Depressive Symptoms</article-title>
          <source>Perspect Psychiatr Care</source>
          <year>2016</year>
          <month>07</month>
          <volume>52</volume>
          <issue>3</issue>
          <fpage>157</fpage>
          <lpage>68</lpage>
          <pub-id pub-id-type="doi">10.1111/ppc.12112</pub-id>
          <pub-id pub-id-type="medline">25800698</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yokotani</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Takagi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wakashima</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Advantages of virtual agents over clinical psychologists during comprehensive mental health interviews using a mixed methods design</article-title>
          <source>Computers in Human Behavior</source>
          <year>2018</year>
          <month>08</month>
          <volume>85</volume>
          <issue>6</issue>
          <fpage>135</fpage>
          <lpage>145</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2018.03.045</pub-id>
          <pub-id pub-id-type="medline">2018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Samant</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Squibbs</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chaet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Morshedi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Design of Interactive Cancer Education Technology for Latina Farmworkers</article-title>
          <year>2014</year>
          <month>04</month>
          <conf-name>The 2014 IEEE International Symposium on Software Reliability Engineering Workshops</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>Washington</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29978858"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/SIEDS.2014.6829908</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jadeja</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Varia</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Perspectives for evaluating conversational AI</article-title>
          <source>arXiv preprint</source>
          <year>2017</year>
          <fpage>1</fpage>
          <lpage>6</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bangor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kortum</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>An Empirical Evaluation of the System Usability Scale</article-title>
          <source>International Journal of Human-Computer Interaction</source>
          <year>2008</year>
          <month>07</month>
          <day>30</day>
          <volume>24</volume>
          <issue>6</issue>
          <fpage>574</fpage>
          <lpage>594</lpage>
          <pub-id pub-id-type="doi">10.1080/10447310802205776</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brooke</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>McClelland</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Weerdmeester</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>SUS-A quick and dirty usability scale</article-title>
          <source>Usability evaluation in industry</source>
          <year>1996</year>
          <publisher-loc>London</publisher-loc>
          <publisher-name>CRC Press</publisher-name>
          <fpage>4</fpage>
          <lpage>7</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moorhead</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bond</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Coates</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>McTear</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Can we use conventional methods to assess conversational user interfaces?</article-title>
          <year>2019</year>
          <conf-name>The 31st European Conference on Cognitive Ergonomics</conf-name>
          <conf-date>2019</conf-date>
          <conf-loc>Belfast</conf-loc>
          <publisher-loc>Usability testing of a healthcare chatbot</publisher-loc>
          <fpage>207</fpage>
          <lpage>2014</lpage>
          <pub-id pub-id-type="doi">10.1145/3335082.3335094</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shum</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>From Eliza to XiaoIce: challenges and opportunities with social chatbots</article-title>
          <source>Frontiers Inf Technol Electronic Eng</source>
          <year>2018</year>
          <month>1</month>
          <day>8</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>10</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1631/fitee.1700826</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laranjo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Kocaballi</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bashir</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Surian</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gallego</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Magrabi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>AYS</given-names>
            </name>
            <name name-style="western">
              <surname>Coiera</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Conversational agents in healthcare: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>09</month>
          <day>01</day>
          <volume>25</volume>
          <issue>9</issue>
          <fpage>1248</fpage>
          <lpage>1258</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30010941"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy072</pub-id>
          <pub-id pub-id-type="medline">30010941</pub-id>
          <pub-id pub-id-type="pii">5052181</pub-id>
          <pub-id pub-id-type="pmcid">PMC6118869</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abd-alrazaq</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Alajlani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alalwan</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Bewick</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Househ</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>An overview of the features of chatbots in mental health: A scoping review</article-title>
          <source>International Journal of Medical Informatics</source>
          <year>2019</year>
          <month>12</month>
          <volume>132</volume>
          <fpage>103978</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.103978</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abd-alrazaq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rababeh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alajlani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bewick</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Househ</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The effectiveness and safety of using chatbots to improve mental health: A systematic review and meta-analysis</article-title>
          <source>Journal of Medical Internet Research. Forthcoming</source>
          <year>2020</year>
          <fpage>2020</fpage>
          <comment>(forthcoming)</comment>
          <pub-id pub-id-type="doi">10.2196/16021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaidyam</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Wisniewski</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Halamka</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Kashavan</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Chatbots and Conversational Agents in Mental Health: A Review of the Psychiatric Landscape</article-title>
          <source>Can J Psychiatry</source>
          <year>2019</year>
          <month>07</month>
          <volume>64</volume>
          <issue>7</issue>
          <fpage>456</fpage>
          <lpage>464</lpage>
          <pub-id pub-id-type="doi">10.1177/0706743719828977</pub-id>
          <pub-id pub-id-type="medline">30897957</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Provoost</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Ruwaard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Riper</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Embodied Conversational Agents in Clinical Psychology: A Scoping Review</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>05</month>
          <day>09</day>
          <volume>19</volume>
          <issue>5</issue>
          <fpage>e151</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2017/5/e151/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.6553</pub-id>
          <pub-id pub-id-type="medline">28487267</pub-id>
          <pub-id pub-id-type="pii">v19i5e151</pub-id>
          <pub-id pub-id-type="pmcid">PMC5442350</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
