<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="review-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i10e20346</article-id>
      <article-id pub-id-type="pmid">33090118</article-id>
      <article-id pub-id-type="doi">10.2196/20346</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>The Effectiveness of Artificial Intelligence Conversational Agents in Health Care: Systematic Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>McRoy</surname>
            <given-names>Susan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Huang</surname>
            <given-names>Xiaolei</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Milne-Ives</surname>
            <given-names>Madison</given-names>
          </name>
          <degrees>BAS, MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7628-882X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>de Cock</surname>
            <given-names>Caroline</given-names>
          </name>
          <degrees>BSc, MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7585-9598</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Lim</surname>
            <given-names>Ernest</given-names>
          </name>
          <degrees>BSc, MBBS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6972-0511</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Shehadeh</surname>
            <given-names>Melissa Harper</given-names>
          </name>
          <degrees>BSc, MSc, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8955-0399</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>de Pennington</surname>
            <given-names>Nick</given-names>
          </name>
          <degrees>MA, BM BCh</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4536-4978</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Mole</surname>
            <given-names>Guy</given-names>
          </name>
          <degrees>BSc, MBBS, MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9184-2531</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Normando</surname>
            <given-names>Eduardo</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5774-8082</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Meinert</surname>
            <given-names>Edward</given-names>
          </name>
          <degrees>MA, MSc, MBA, MPA, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <address>
            <institution>Centre for Health Technology</institution>
            <institution>University of Plymouth</institution>
            <addr-line>8 Kirkby Place</addr-line>
            <addr-line>Room 2</addr-line>
            <addr-line>Plymouth, PL4 6DT</addr-line>
            <country>United Kingdom</country>
            <phone>44 7824446808</phone>
            <email>edward.meinert@plymouth.ac.uk</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2484-3347</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Digitally Enabled PrevenTative Health Research Group</institution>
        <institution>Department of Paediatrics</institution>
        <institution>University of Oxford</institution>
        <addr-line>Oxford</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Imperial College Healthcare NHS Trust</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Ufonia Limited</institution>
        <addr-line>Oxford</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Institute of Global Health</institution>
        <institution>University of Geneva</institution>
        <addr-line>Geneva</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Oxford University Hospitals NHS Foundation Trust</institution>
        <addr-line>Oxford</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Primary Care and Public Health</institution>
        <institution>Imperial College London</institution>
        <addr-line>London</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Centre for Health Technology</institution>
        <institution>University of Plymouth</institution>
        <addr-line>Plymouth</addr-line>
        <country>United Kingdom</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Edward Meinert <email>edward.meinert@plymouth.ac.uk</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>22</day>
        <month>10</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>10</issue>
      <elocation-id>e20346</elocation-id>
      <history>
        <date date-type="received">
          <day>17</day>
          <month>5</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>8</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>2</day>
          <month>9</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Madison Milne-Ives, Caroline de Cock, Ernest Lim, Melissa Harper Shehadeh, Nick de Pennington, Guy Mole, Eduardo Normando, Edward Meinert. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 22.10.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2020/10/e20346/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The high demand for health care services and the growing capability of artificial intelligence have led to the development of conversational agents designed to support a variety of health-related activities, including behavior change, treatment support, health monitoring, training, triage, and screening support. Automation of these tasks could free clinicians to focus on more complex work and increase the accessibility of health care services for the public. An overarching assessment of the acceptability, usability, and effectiveness of these agents in health care is needed to collate the evidence so that future development can target areas for improvement and potential for sustainable adoption.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This systematic review aims to assess the effectiveness and usability of conversational agents in health care and identify the elements that users like and dislike to inform future research and development of these agents.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>PubMed, Medline (Ovid), EMBASE (Excerpta Medica dataBASE), CINAHL (Cumulative Index to Nursing and Allied Health Literature), Web of Science, and the Association for Computing Machinery Digital Library were systematically searched for articles published since 2008 that evaluated unconstrained natural language processing conversational agents used in health care. EndNote (version X9, Clarivate Analytics) reference management software was used for initial screening, and full-text screening was conducted by 1 reviewer. Data were extracted, and the risk of bias was assessed by one reviewer and validated by another.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A total of 31 studies were selected and included a variety of conversational agents, including 14 chatbots (2 of which were voice chatbots), 6 embodied conversational agents (3 of which were interactive voice response calls, virtual patients, and speech recognition screening systems), 1 contextual question-answering agent, and 1 voice recognition triage system. Overall, the evidence reported was mostly positive or mixed. Usability and satisfaction performed well (27/30 and 26/31), and positive or mixed effectiveness was found in three-quarters of the studies (23/30). However, there were several limitations of the agents highlighted in specific qualitative feedback.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The studies generally reported positive or mixed evidence for the effectiveness, usability, and satisfactoriness of the conversational agents investigated, but qualitative user perceptions were more mixed. The quality of many of the studies was limited, and improved study design and reporting are necessary to more accurately evaluate the usefulness of the agents in health care and identify key areas for improvement. Further research should also analyze the cost-effectiveness, privacy, and security of the agents.</p>
        </sec>
        <sec sec-type="registered-report">
          <title>International Registered Report Identifier (IRRID)</title>
          <p>RR2-10.2196/16934</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>artificial intelligence</kwd>
        <kwd>avatar</kwd>
        <kwd>chatbot</kwd>
        <kwd>conversational agent</kwd>
        <kwd>digital health</kwd>
        <kwd>intelligent assistant</kwd>
        <kwd>speech recognition software</kwd>
        <kwd>virtual assistant</kwd>
        <kwd>virtual coach</kwd>
        <kwd>virtual health care</kwd>
        <kwd>virtual nursing</kwd>
        <kwd>voice recognition software</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Conversational agents are among the many digital technologies being introduced into the health sector to address current health care challenges, such as shortages of health care providers, which reduce the availability and accessibility of health care services [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. Conversational agents use artificial intelligence (AI), including machine learning (a statistical means of training models with data so that they can make predictions based on a variety of features) and natural language processing (NLP; the ability to recognize and analyze verbal and written language) to interact with humans via speech, text, or other inputs and outputs on mobile, web-based, or audio-based platforms [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Many of these agents are designed to use NLP so that users can speak or write to the agent as they would to a human. The agent can then analyze the input and respond appropriately in a conversational manner [<xref ref-type="bibr" rid="ref5">5</xref>].</p>
        <p>Conversational agents first emerged as a tool in health care in 1966, with the development of a virtual psychotherapist (ELIZA) that could provide predetermined answers to text-based user input [<xref ref-type="bibr" rid="ref6">6</xref>]. In the decades since, the capabilities of NLP have significantly progressed and aided the development of more advanced AI agents. Many different types of conversational agents that use NLP have been developed, including chatbots, embodied conversational agents (ECAs), and virtual patients, and are accessible by telephone, mobile phones, computers, and many other digital platforms [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. The types of input that conversational agents can receive and interpret have also expanded, with some conversational agents capable of analyzing movements, such as gestures, facial expressions, and eye movements [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>Conversational agents have been developed for many different aspects of the health sector to support health care professionals and the general public. Specific uses include screening for health conditions, triage, counseling, at-home health management support, and training for health care professionals [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. With phone, mobile, and online platforms being widely accessible, conversational agents can support populations with limited access to health care or poor health literacy [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. They also have the potential to be affordably scaled up to reach large proportions of a population [<xref ref-type="bibr" rid="ref3">3</xref>]. Due to this accessibility, conversational agents are also a promising tool for the advancement of patient-centered care and can support users’ involvement in the management of their own health [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Personalizable features have the potential to further improve usability and satisfaction, although more research is needed to evaluate their effectiveness in achieving their stated health outcomes and reducing costs and to ensure that there are no negative consequences for decision making or privacy [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
        <p>Despite the large body of research concerning the application of conversational agents in health care, most reviews have limited their focus to a particular health area, agent type, or function [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. Although there are a few recent systematic reviews that have examined a more comprehensive scope, they have presented an overall synthesis of the body of knowledge. One review developed a taxonomy that described the architecture and functions of conversational agents in health care and the state of the field but did not evaluate the effectiveness, usability, or implications for users [<xref ref-type="bibr" rid="ref5">5</xref>]. Another systematic review investigated the outcome measures of the studies of conversational agents but limited the inclusion criteria to agents that used natural language input and had been tested with human participants [<xref ref-type="bibr" rid="ref2">2</xref>]. Additionally, their initial database searches only retrieved 1531 articles, which raises the concern that some relevant articles may have been overlooked [<xref ref-type="bibr" rid="ref2">2</xref>]. Their search was updated in February 2018, but given the rapid pace of technological development, there is a need to provide an update and expansion to these previous systematic reviews.</p>
        <p>For conversational agents to be successful in health care, it is crucial to understand the effectiveness of current agents in achieving their intended outcomes. However, it is just as important to understand how users feel about and relate to these agents because the adoption of new health technologies depends on user perceptions (eg, whether they trust the technology, find it easy to use, and feel that privacy and data security are respected) [<xref ref-type="bibr" rid="ref23">23</xref>]. User-identified problems will need to be addressed if conversational agents are to have a significant impact on health care, because their impact depends on people being willing to use them and preferring to use them over alternatives. The information gathered in this review identifies the current issues with conversational agents that need to be overcome and can be used to help determine which elements of the agents are most likely to be successful and useful in various aspects of health care. As conversational agents are often touted as having the potential to reduce the burden on health care resources, the implications of the agents for improved health care provision and reduced resource demand also need to be assessed.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The primary objectives of this review are to describe the scope of conversational agents currently being used for health care activities (by patients, health care providers, or the general public), examine the user perceptions of these agents, and evaluate their effectiveness. We developed 3 main research questions to address these objectives. First, are the conversational agents investigated effective at achieving their intended health-related outcomes, and does the effectiveness vary depending on the type of agent? Second, how do users rate the usability and satisfactoriness of the conversational agents, and what specific elements of the agents do they like and dislike? Finally, what are the current limitations and gaps in the utility of conversational agents in health care? These objectives build on previous systematic reviews while widening the scope of included studies to update the body of knowledge on conversational agents in health care and to inform future research and development.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Database Search</title>
        <p>The full methods for this review have been published in detail in a systematic review protocol [<xref ref-type="bibr" rid="ref24">24</xref>]. The population, intervention, comparison, and outcome framework [<xref ref-type="bibr" rid="ref25">25</xref>] was used to develop the search strategy, which was implemented following the PRISMA-P (Preferred Reporting Items for Systematic Review and Meta-Analyses Protocols) checklist [<xref ref-type="bibr" rid="ref26">26</xref>]. No study design filter was used; any type of study was eligible for inclusion. The search strategy was finalized and tailored to different databases in consultation with a medical librarian. PubMed, Medline (Ovid), EMBASE (Excerpta Medica dataBASE), CINAHL (Cumulative Index to Nursing and Allied Health Literature), Web of Science, and the Association for Computing Machinery Digital Library databases were searched. The search terms were grouped into 3 themes (conversational agents, health application, and outcome assessment) to capture all studies that fit the key inclusion criteria: evaluating conversational agents used in health care. These themes were subsequently searched with the structure: conversational agent (MeSH OR Keywords) AND health application (MeSH OR Keywords) AND outcome assessment (MeSH OR Keywords). The full search strategy can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The search was completed on November 29, 2019.</p>
      </sec>
      <sec>
        <title>Inclusion and Exclusion Criteria</title>
        <p>This systematic review aimed to assess conversational agents designed for health care purposes. Studies that evaluated at least 1 conversational agent were included. Studies targeting any population group, geographical location, and mental or physical health-related function (eg, screening, education, training, and self-management) were included. These broad inclusion criteria were established to enable an assessment of a wide range of applications of conversational agents. There were no restrictions on study type, as long as a conversational agent was evaluated, and intervention and observational studies such as cross-sectional surveys, cohort studies, and qualitative studies were included. Intervention studies were not required to have a specific comparator or any comparator.</p>
        <p>During the screening process, studies of conversational agents that were not capable of interacting with human users via unconstrained NLP were excluded. These included conversational agents that only allowed users to select from predefined options or agents with prerecorded responses that did not adapt to subsequent user responses. The basis for this exclusion is that, without the capability of using NLP, computational methods and technologies are rudimentary and do not advance the aims of AI for autonomous computational agents. As many studies did not explicitly state whether the investigated agent was capable of NLP, a description in the paper of the conversational agent allowing free-text or free-speech input was used as an indicator for NLP, and these studies were included. Studies that did not report the architecture of the agent were excluded.</p>
        <p>Due to the number of conversational agents in development and/or those that did not progress to the evaluation stages of development, studies that were solely descriptive were excluded. Furthermore, because of the pace at which conversational agents have developed over recent decades, studies were limited to those published during or after 2008. In 2008, the first iPhone was released, and it marks an increase in the prevalence and capabilities of digital technology. Only studies published in English were included to ensure accurate interpretation by the authors. Conference publications were also excluded from the review of peer-reviewed literature.</p>
      </sec>
      <sec>
        <title>Outcomes</title>
        <p>The primary objective of this review was to provide an overview of the use of NLP conversational agents in health care. Therefore, the primary outcomes evaluated were the effectiveness of conversational agents in achieving their intended health-related outcomes and user perceptions of the agents (including but not limited to acceptability, usability, satisfaction, and specific qualitative feedback). Secondary outcomes included improvement in health care provision and resource implications for the health care system.</p>
      </sec>
      <sec>
        <title>Screening and Study Selection</title>
        <p>All studies retrieved from the databases were stored in the reference management software EndNote (version X9, Clarivate Analytics), which automatically eliminated duplicates. Due to time constraints, the EndNote search function was used to extract relevant studies before the screening of the citations against the inclusion and exclusion criteria by 2 independent reviewers. Where duplicates or publications from the same study were identified, the more recent publication or the one with the most detail was selected for inclusion in the review. All disagreements were discussed, and if a consensus was not reached, a third reviewer was consulted. Full EndNote search details are shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        <p>The full texts of the articles that met the inclusion criteria were screened by one of the reviewers. Of the screened articles deemed eligible for inclusion, 58 were conference or meeting abstracts and did not have full texts available; therefore, they were excluded. This highlights the early developmental stages of many of these agents.</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>Data were extracted by 1 reviewer, and key data points from the studies, specified in the protocol and identified on further study of the publications, were recorded in a spreadsheet and validated by a second reviewer. The data extraction form was based on the minimum requirements recommended by the Cochrane Handbook for Systematic Reviews [<xref ref-type="bibr" rid="ref27">27</xref>]. The types of data extracted from the studies are shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Data extracted from the studies.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Article information</td>
                <td>Data extracted</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>
                  General study information
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Title of publication</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Year of publication</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Authors</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  Study characteristics
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Study design</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Country of study</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Study population</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Analyzed sample size</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Comparators</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Study duration</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  Characteristics of the conversational agents
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Name of conversational agents</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Architecture</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Device or platform on which agent is accessed</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Intended user</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Primary purpose</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  Intended outcomes of the conversational agents
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Health objective (general)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Health objective (specific)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  Evaluation
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Effectiveness in achieving intended purpose</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Health literacy</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Improvement in health care provision</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Health care resource implications</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Usability</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Acceptability or satisfaction</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>User perceptions or qualitative feedback</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Conclusions</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Implications for future study</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Risk-of-Bias and Quality Assessment</title>
        <p>All quality assessments were conducted by 2 independent reviewers, with disagreements resolved by consensus. If this was not possible, the opinion of a third reviewer was sought. As there was a wide variety of study designs, the study types were classified by 1 reviewer and validated by a second reviewer, with disagreements being resolved by discussion with a third reviewer. As the broad inclusion criteria were intended to capture all relevant studies, a few of the included studies used implementation models for AI research that were beyond the scope of classic public health design methods. This resulted in some study designs being categorized as <italic>other</italic>.</p>
        <p>The Cochrane Collaboration risk-of-bias tool was used to evaluate the risk of bias in randomized controlled trials (RCTs) [<xref ref-type="bibr" rid="ref28">28</xref>]. The CASP (Critical Appraisal Skills Programme) tools for cohort and qualitative studies were used for the respective studies [<xref ref-type="bibr" rid="ref29">29</xref>], and the Appraisal tool for Cross-Sectional Studies (AXIS) tool was used to assess the quality of cross-sectional survey studies [<xref ref-type="bibr" rid="ref30">30</xref>]. Studies that were coded as <italic>other</italic> design types were also assessed using the AXIS tool, which was deemed to be the most rigorous and appropriate tool because it systematically evaluates elements of the introduction, methods, results, and discussion sections, and is not limited to the RCT-specific questions used in the risk-of-bias tool.</p>
        <p>The results of the Cochrane Collaboration risk-of-bias tool were summarized using RevMan 5.3. CASP and AXIS scores were calculated using yes=1, no=0, and cannot tell or do not know=0 for each question. The scores for each question were summed to provide a score for each study, which were averaged according to study type and are presented in the results.</p>
      </sec>
      <sec>
        <title>Data Analysis and Synthesis</title>
        <p>Due to the variability in populations, interventions, outcomes, and study designs, a meta-analysis of the studies was not possible. Therefore, we report a structured analysis of the findings to draw conclusions about the effectiveness and user perceptions of conversational agents in health care. For the purpose of this review, the agent was considered effective if there was a statistically significant (<italic>P</italic>&#60;.05) improvement in a given outcome as compared with a comparator or control, or over time. If no significance was reported or the difference was nonsignificant or significantly worse between groups or over time, the agent was considered to have no significant evidence supporting it. Limitations and future directions for research were also summarized.</p>
        <p>The synthesis framework for the assessment of health information technology (SF/HIT) was used to structure the evaluation of the studies because it included a whole system set of outcome variables [<xref ref-type="bibr" rid="ref31">31</xref>]. These included effectiveness, satisfaction, and perceived ease of use or usefulness, among others. In accordance with the framework, evidence for each of the outcome variables was coded as <italic>positive or mixed</italic> or <italic>neutral or negative</italic>. If the study did not address the outcome in question, it was coded as <italic>neutral or negative</italic>.</p>
        <p>Finally, where qualitative user feedback was reported by the studies, it was examined to extract common themes by extracting the sections of the original text that discussed the qualitative perceptions, reducing them to key themes, and then comparing those key themes across the different studies.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Included Studies</title>
        <p>Overall, 9441 studies were retrieved from the 6 databases, of which 2782 were duplicates. The reference management software EndNote was used for initial screening, with keywords based on the original search categories used to exclude studies that did not meet the criteria. After 6 passes, 957 citations remained for abstract screening. The primary reason for exclusion at the screening stage was that the study did not include an interactive, responsive conversational agent (n=470), was a review paper (n=65), was not health-related (n=48), or did not report any evaluation of the conversational agent (n=46). Of these 957 citations, 293 were selected for full-text review. In the final review, 31 papers were included. The reasons for exclusion after full-text review are detailed in <xref rid="figure1" ref-type="fig">Figure 1</xref>, with the most common reason being that the conversational agent did not use NLP (n=81), the full text was not available (n=71), or there was no conversational agent in the study (n=51).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses flow diagram. NLP: natural language processing.</p>
          </caption>
          <graphic xlink:href="jmir_v22i10e20346_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Study Characteristics</title>
        <p>The characteristics of the 31 included studies are summarized in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref56">56</xref>]. Of these studies, 45% (14/31) evaluated conversational agents that had some type of audio or speech element. Of the agents, 45% (14/31) were chatbots (including 2 voice chatbots and 1 chatbot that also used a wizard), 19% (6/31) were ECAs (including 1 virtual doctor), and 10% (3/31) each were interactive voice response (IVR) phone calls, virtual patients, and speech recognition screening systems. The final 2 comprised a contextual question-answering agent and a voice recognition triage system. Of the 26 studies that reported the device on which their conversational agent was used, 35% (9/26) used computers, 27% (7/26) used web-based apps, 23% (6/26) used mobile phone apps, 15% (4/26) used telephone calls, and 1 study used a tablet (the percentages do not add up to 100% because one agent could be used on a computer and also the telephone).</p>
        <p>There were a wide variety of areas of health care targeted by the conversational agents of the included studies. The largest proportion of them (12/31, 39%) addressed mental health issues [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref42">42</xref>], with 19% (6/31) providing some form of clinical decision or triage support [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>] and treatment support (including encouraging users to get screened) [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref49">49</xref>], 10% (3/31) being used to support training of health care students [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref50">50</xref>] and the screening or diagnosis of users [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref51">51</xref>], 7% (2/31) targeting physical health [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>] and layperson medical education [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]; 1 agent was designed to help monitor users’ speech [<xref ref-type="bibr" rid="ref56">56</xref>]. The percentages do not add up to 100% because some of the studies that addressed mental health also fit into one of the other categories.</p>
        <p>The study designs also varied widely, with 29% (9/31) using cross-sectional designs, 26% (8/31) using RCTs, 23% (7/31) using qualitative methods, 19% (6/31) using cohort studies, and 1 using a cluster crossover design. The full data extraction table is available in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref> [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref56">56</xref>].</p>
      </sec>
      <sec>
        <title>Overall Evaluation of Conversational Agents</title>
        <p>Overall, about three-quarters of the studies (22/30, 73%) reported positive or mixed results for most of the outcomes. A total of 8 studies were coded as reporting positive or mixed evidence for 10 or more of the 11 outcomes specified in the SF/HIT; the analysis for this review was limited to the interpretation of impact as reported by study authors to reflect evaluation outcomes. Excluding 1 study, which was an acceptability study only and did not assess the other outcomes, the average number of outcomes that were coded as <italic>positive or mixed</italic> was 67% (7.4/11, SD 2.5). However, the number of outcomes met per study ranged from 1/11 to 11/11 (9-100%). Perceived ease of use or usefulness (27/30, 90%), the process of service delivery or performance (26/30, 87%), appropriateness (24/30, 80%), and satisfaction (26/31, 84%) were the outcomes that had the most support from the studies. Just over three-quarters (23/30, 77%) of the studies also reported positive or mixed evidence of effectiveness.</p>
        <p>However, very few studies discussed the cost-effectiveness (5/30, 17%, coded as <italic>positive or mixed</italic>) or safety, privacy, and security (14/30, 47%, coded as <italic>positive or mixed</italic>) outcomes for the agents being evaluated. About a quarter of studies (8/30, 27%) had neither positive nor mixed reported evidence for more than half of the SF/HIT outcomes. The evaluation of the SF/HIT outcomes is summarized in <xref ref-type="table" rid="table2">Table 2</xref> [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Summary of the studies based on the evaluation outcomes from the synthesis framework for the assessment of health information technology<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="110"/>
            <col width="70"/>
            <col width="90"/>
            <col width="60"/>
            <col width="90"/>
            <col width="70"/>
            <col width="60"/>
            <col width="70"/>
            <col width="90"/>
            <col width="80"/>
            <col width="80"/>
            <col width="60"/>
            <col width="70"/>
            <thead>
              <tr valign="top">
                <td>First author (reference)</td>
                <td>Preventive care</td>
                <td>Adherence or attendance</td>
                <td>Efficiency</td>
                <td>Perceived ease of use or usefulness</td>
                <td>Effectiveness</td>
                <td>Performance</td>
                <td>Safety or privacy or security</td>
                <td>Acceptability</td>
                <td>Cost-effectiveness</td>
                <td>Appropriateness</td>
                <td>Satisfaction</td>
                <td>n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Adams [<xref ref-type="bibr" rid="ref9">9</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>10 (91)</td>
              </tr>
              <tr valign="top">
                <td>Bibault [<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>10 (91)</td>
              </tr>
              <tr valign="top">
                <td>Borja-Hart [<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>7 (64)</td>
              </tr>
              <tr valign="top">
                <td>Cameron [<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>5 (45)</td>
              </tr>
              <tr valign="top">
                <td>Chaix [<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>8 (73)</td>
              </tr>
              <tr valign="top">
                <td>Chang [<xref ref-type="bibr" rid="ref8">8</xref>]</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>7 (64)</td>
              </tr>
              <tr valign="top">
                <td>Crutzen [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>9 (82)</td>
              </tr>
              <tr valign="top">
                <td>Dimeff [<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>10 (91)</td>
              </tr>
              <tr valign="top">
                <td>Elmasri [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>5 (45)</td>
              </tr>
              <tr valign="top">
                <td>Fitzpatrick [<xref ref-type="bibr" rid="ref13">13</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>10 (91)</td>
              </tr>
              <tr valign="top">
                <td>Friederichs [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>4 (36)</td>
              </tr>
              <tr valign="top">
                <td>Fulmer [<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>6 (55)</td>
              </tr>
              <tr valign="top">
                <td>Galescu [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>3 (27)</td>
              </tr>
              <tr valign="top">
                <td>Ghosh [<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>9 (82)</td>
              </tr>
              <tr valign="top">
                <td>Havik [<xref ref-type="bibr" rid="ref14">14</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>10 (91)</td>
              </tr>
              <tr valign="top">
                <td>Heyworth [<xref ref-type="bibr" rid="ref47">47</xref>]</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>8 (73)</td>
              </tr>
              <tr valign="top">
                <td>Hudlicka [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>11 (100)</td>
              </tr>
              <tr valign="top">
                <td>Inkster [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>9 (82)</td>
              </tr>
              <tr valign="top">
                <td>Ireland [<xref ref-type="bibr" rid="ref56">56</xref>]</td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>1</td>
                <td>1 (100)</td>
              </tr>
              <tr valign="top">
                <td>Isaza-Restrepo [<xref ref-type="bibr" rid="ref15">15</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>10 (91)</td>
              </tr>
              <tr valign="top">
                <td>Ly [<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>5 (45)</td>
              </tr>
              <tr valign="top">
                <td>Nakagawa [<xref ref-type="bibr" rid="ref12">12</xref>]</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>7 (64)</td>
              </tr>
              <tr valign="top">
                <td>Philip (2014) [<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>10 (91)</td>
              </tr>
              <tr valign="top">
                <td>Philip (2017) [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>9 (82)</td>
              </tr>
              <tr valign="top">
                <td>Rhee [<xref ref-type="bibr" rid="ref48">48</xref>]</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>9 (82)</td>
              </tr>
              <tr valign="top">
                <td>Simon [<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>7 (64)</td>
              </tr>
              <tr valign="top">
                <td>Spänig [<xref ref-type="bibr" rid="ref43">43</xref>]</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>6 (55)</td>
              </tr>
              <tr valign="top">
                <td>Washburn [<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>5 (45)</td>
              </tr>
              <tr valign="top">
                <td>Wong [<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1 (9)</td>
              </tr>
              <tr valign="top">
                <td>Xu [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>5 (45)</td>
              </tr>
              <tr valign="top">
                <td>Yasavur [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>1</td>
                <td>0</td>
                <td>0</td>
                <td>1</td>
                <td>0</td>
                <td>1</td>
                <td>1</td>
                <td>7 (64)</td>
              </tr>
              <tr valign="top">
                <td>n (%)</td>
                <td>17 (57)</td>
                <td>19 (63)</td>
                <td>22 (73)</td>
                <td>27 (90)</td>
                <td>23 (77)</td>
                <td>26 (87)</td>
                <td>14 (47)</td>
                <td>20 (67)</td>
                <td>5 (17)</td>
                <td>24 (80)</td>
                <td>26 (84)</td>
                <td>
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Positive or mixed results have been coded as 1, and neutral or negative results as 0.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>When grouped by the agent’s health care scope, studies of certain types of agents appear to do better than others (<xref ref-type="table" rid="table3">Table 3</xref>). Studies examining screening or diagnosis agents and treatment support agents had the highest average number of positive or mixed outcomes (mean 10, SD 0.6, and mean 9, SD 1.2, respectively). Treatment support agents had primary functions that included empowering patients to engage more fully in clinical appointments, encouraging attending screenings for health care conditions, and supporting patient self-management. In contrast, mental health agents focused on addressing challenges related to depression, anxiety, and alcohol abuse, among others. However, given the small number of studies for each category of agents, these comparisons should be interpreted with caution.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Summary of evaluation outcomes by the area of health care addressed by the conversational agent<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="370"/>
            <col width="170"/>
            <col width="280"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Agent focus</td>
                <td>Number of studies</td>
                <td>Average number of outcomes coded <italic>positive or mixed</italic>, n (%)</td>
                <td>Range of scores (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Mental health [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                <td>12</td>
                <td>7 (66)</td>
                <td>5-11 (2.4)</td>
              </tr>
              <tr valign="top">
                <td>Clinical decision or triage support [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                <td>6</td>
                <td>7 (67)</td>
                <td>5-10 (1.9)</td>
              </tr>
              <tr valign="top">
                <td>Treatment support [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>6</td>
                <td>9 (79)</td>
                <td>7-10 (1.2)</td>
              </tr>
              <tr valign="top">
                <td>Health care training (students) [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>3</td>
                <td>7 (67)</td>
                <td>5-10 (2.5)</td>
              </tr>
              <tr valign="top">
                <td>Screening or diagnosis [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]</td>
                <td>3</td>
                <td>10 (88)</td>
                <td>9-10 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>Health care education (laypeople) [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]</td>
                <td>2</td>
                <td>5 (45)</td>
                <td>1-9 (5.7)</td>
              </tr>
              <tr valign="top">
                <td>Physical health [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>2</td>
                <td>4 (32)</td>
                <td>3-4 (0.7)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>The number of studies does not add up to 31 because some studies fit into 2 categories, and the study on monitoring speech was not included because it only addressed 1 of the 11 outcomes. The percentages associated with the average number of outcomes varied slightly because of rounding.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Qualitative User Perceptions</title>
        <p>A total of 18 of the 31 studies included more specific user feedback. The most frequently raised issue with conversational agents (9 studies) was poor understanding because of limited vocabulary, voice recognition accuracy, or error management of word inputs [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref52">52</xref>]. Related to this issue, as the conversational agents often had to ask questions more than once to be able to process the response, users in 3 studies noted disliking the repetitive conversations with the agents [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Both of these issues are key areas of improvement for future research and development of conversational agents because they represent limitations in the usability of the agents in a real-world context.</p>
        <p>Feedback from users in 5 studies expressed a preference for interactivity, with users in 1 study noting that they liked the interactivity of the chatbot [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>], and users in the other 4 studies expressed a desire for greater interactivity or relational skills in the conversational agent [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref53">53</xref>]. Similarly, users in 4 studies reported liking that the agent had a personality and/or showed empathy [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref42">42</xref>], whereas users in other studies reported disliking the lack of personal connection or had difficulty in empathizing with the agent [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref50">50</xref>] or reported disliking its limited conversation and responses [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <p>Due to the wide variety of conversational agents, their aims and health care contexts, much of the qualitative user perception data concerned distinct aspects of the agents. However, several studies reported feedback concerned with customization or availability of feature options, with 2 studies commenting on it positively (eg, having both voice and touch modes to allow hands-free work and rapid data input on a triage system for nurses) [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref35">35</xref>], and 3 studies desiring more features and more control [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. Additionally, users in 2 studies suggested that better integration of the agent with electronic health record (EHR) systems (for a virtual doctor [<xref ref-type="bibr" rid="ref42">42</xref>]) or health care providers (for an asthma self-management chatbot [<xref ref-type="bibr" rid="ref48">48</xref>]) would be useful.</p>
        <p>Other features of the agents that users reported liking were the reminders and assistance in forming routines [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref48">48</xref>] and that the agents provided accountability [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref48">48</xref>], facilitated learning [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>], and were easy to learn and use [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. In the included studies, 3 of the conversational agents were virtual patients, and users in all 3 studies reported liking that it provided a platform for risk-free learning because they were not practicing on real patients [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref50">50</xref>].</p>
        <p>Several studies reported user feedback that was specific to that conversational agent. This included a preference for telephone IVR over web-based pediatric care guidance [<xref ref-type="bibr" rid="ref9">9</xref>] and a simple avatar with a computer-generated voice over a more life-like agent with a recorded voice [<xref ref-type="bibr" rid="ref42">42</xref>]. Users in 1 study reported liking that the agent initiated conversations [<xref ref-type="bibr" rid="ref37">37</xref>]. There was opposite feedback in 2 studies about the format of the response, with users preferring preformatted options for one chatbot [<xref ref-type="bibr" rid="ref36">36</xref>], whereas some users preferred the free-text responses for a diagnostic chatbot because it allowed them to provide contextual information. In contrast, others found it more difficult to know how to respond so the agent would understand [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>Other agent-specific negative feedback was that the virtual doctor did not have the ability to go deep enough or provide access to other materials [<xref ref-type="bibr" rid="ref42">42</xref>], that too much information was provided [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref33">33</xref>] or the interaction was too long [<xref ref-type="bibr" rid="ref13">13</xref>], the use of nonverbal expressions by the avatar [<xref ref-type="bibr" rid="ref35">35</xref>], and a lack of clarity regarding the aim of the chatbot [<xref ref-type="bibr" rid="ref37">37</xref>]. Some students who used the virtual patients also reported that it was difficult to empathize [<xref ref-type="bibr" rid="ref50">50</xref>] and that the agent did not sufficiently encompass real situational complexity [<xref ref-type="bibr" rid="ref15">15</xref>]. The variety of specific feedback reports demonstrates the importance of examining usability for individual conversational agents and tailoring the design to the intended population. Although there were some preferences and complaints that were frequently reported, much of the feedback was agent dependent. A summary of the thematic analysis is included in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
      </sec>
      <sec>
        <title>Implications for Health Care Provision and Resources</title>
        <p>Unfortunately, only a few of the studies discussed any improvement in health care provision or implications for resources; 2 of the studies that suggested improvement in health care provision were evaluating virtual patients [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref50">50</xref>], and students in 1 study reported significantly increased confidence in their clinical skills and ability to interview patients. Over 80% of users also reported that the agents helped them follow their treatment more effectively [<xref ref-type="bibr" rid="ref45">45</xref>] and be more prepared for pediatric visits [<xref ref-type="bibr" rid="ref9">9</xref>]. In a study of an ECA for sleep disorder screening, 65% of users reported thinking that the agent could provide significant assistance to physicians [<xref ref-type="bibr" rid="ref51">51</xref>]. Regarding resource implications, the study of a preparatory IVR phone call before pediatric visits found that visit time was significantly reduced in the IVR group compared with the control group [<xref ref-type="bibr" rid="ref9">9</xref>]. The use of an ECA to screen for depression [<xref ref-type="bibr" rid="ref38">38</xref>] and a virtual doctor for suicidal patients in emergency departments (EDs) [<xref ref-type="bibr" rid="ref42">42</xref>] were suggested by the authors to save physicians’ time and reduce the costs associated with ED visits for suicidal ideation, but these outcomes were not evaluated. Similarly, another study suggested that mindfulness meditation could be of more use with more cost-effective training made available via a virtual coach [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        <p>Suggestions such as this, that conversational agents have the potential to improve health care provision, save health care providers’ time, and reduce costs, were frequently made in the studies. However, as demonstrated above, very few studies quantified these claims and even fewer measured these outcomes with objective measures. This is a limitation of the studies as a whole. Although many were in the early stages of testing, claims about the potential value to the health care system in terms of time or money should be substantiated. However, as evidenced by the number of <italic>neutral or negative</italic> coding in the evaluation, many of the studies did not consider whole system implementation outcomes. It will be important for the future development of conversational agents to consider outcomes such as these from the beginning so that agents that are not only acceptable and usable but also provide value to the health care system can be built.</p>
      </sec>
      <sec>
        <title>Risk-of-Bias and Quality Assessments</title>
        <p>There were a variety of study types included in this review; so several different quality assessment tools were used to assess the risk of bias and quality of the 31 included studies. A total of 6 studies could not be classified as RCTs, cohort, qualitative, or cross-sectional studies, and their study design was coded as <italic>other</italic> [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. Most of these studies were papers describing the development and initial evaluation of conversational agents, and half of them did not have participants [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. Initially, studies that did not have an explicit design were classified as qualitative or interpretative studies. However, on further analysis, many of the studies did not fit the criteria for qualitative studies - evaluating subjective, thematic, and non-numerical data - because they evaluated performance metrics such as word error rates [<xref ref-type="bibr" rid="ref52">52</xref>], accuracy [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref55">55</xref>], precision [<xref ref-type="bibr" rid="ref44">44</xref>], and user experience quantified on Likert scales [<xref ref-type="bibr" rid="ref39">39</xref>]. Therefore, these studies were coded as <italic>other</italic> and assessed using the AXIS tool for cross-sectional studies, which was deemed to provide the most systematic evaluation of the various elements of the studies [<xref ref-type="bibr" rid="ref30">30</xref>]. 
The quality of these studies was assessed as best as possible; however, the judgments should be considered in the context of these limitations.</p>
        <p>Overall, the quality of the studies was poor to moderate. On average, RCTs [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref53">53</xref>] and qualitative studies [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref56">56</xref>] evaluated were generally determined to have the highest quality and lowest risk of bias, with none of the other 3 study types meeting more than half the criteria for quality assessment. The evaluation of the risk of bias for the 8 RCTs (<xref rid="figure2" ref-type="fig">Figure 2</xref>) was carried out using the Cochrane Collaboration risk-of-bias tool [<xref ref-type="bibr" rid="ref28">28</xref>], and the results were summarized using RevMan 5.3 software (Cochrane) [<xref ref-type="bibr" rid="ref57">57</xref>]. Overall, the RCTs performed fairly well in the risk-of-bias assessment (<xref rid="figure3" ref-type="fig">Figure 3</xref>). About half the studies were assessed as having a low risk of selection bias because of proper random sequence generation (5/8) and allocation concealment (4/8), and a low risk of reporting bias (4/8), as outcomes reported could be compared with a priori protocols or trial registrations. Most studies reported blinding of outcome assessors (7/8) and a low risk of attrition bias because of low or equal dropout across groups or the use of intention-to-treat analyses (6/8). Most of the studies (5/8) had a high risk of performance bias, but this was predominantly because blinding was not possible given the nature of the intervention.</p>
        <p>The cohort (n=9) and qualitative (n=3) studies assessed using the CASP checklists met, on average, 5/12 (range 1-10) and 7/10 (range 4-9) criteria, respectively [<xref ref-type="bibr" rid="ref29">29</xref>]. Of the cohort studies, the questions with the best performance were, “Did the study address a clearly focused issue?” (8/9 yes), “Was the follow up long enough?” (8/9 yes), and “Do the results of this study fit with other available evidence?” (6/9 yes). Studies performed the worst, either by failing to meet the criteria or failing to report it, on questions about cohort recruitment (1/9 yes), identifying and accounting for confounding factors (1/9 yes), accurate exposure and outcome measurement (2/9 and 3/9 yes, respectively), and the applicability of results to the local population (3/9 yes). The qualitative studies, on the other hand, performed best on the questions about whether the qualitative methodology was appropriate, the consideration of ethical issues, clear statements of findings, and whether the results would help locally (3/3 yes for each). None of the 3 studies reported any consideration of the relationship between researcher and participant. They also performed poorly on questions about sample recruitment, data collection, and data analysis (1/3 yes for each).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Risk of bias summary: review authors' judgements about each risk of bias item for each included study.</p>
          </caption>
          <graphic xlink:href="jmir_v22i10e20346_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Risk of bias graph: review authors' judgements about each risk of bias item presented as percentages across all included studies.</p>
          </caption>
          <graphic xlink:href="jmir_v22i10e20346_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The cross-sectional (n=5) and <italic>other</italic> (n=6) studies assessed using the AXIS tool met, on average, 50% (range 26-80%) and 42% (range 29-70%) of the criteria, respectively [<xref ref-type="bibr" rid="ref30">30</xref>]. Percentages are reported instead of the exact number of criteria because several of the questions were not applicable to the studies; so the total number of criteria assessed per study was not the same (averages 19 and 16; ranges 18-20, and 10-19, respectively). Overall, the cross-sectional studies performed best on questions about the clarity of aims (5/5 yes), appropriate outcome variables for the aims (5/5 yes), internal consistency (5/5 yes), and adequate description of basic data (4/5 yes). They performed worst on questions about sample selection—whether it was taken from an appropriate base to represent the population (1/5 yes) and whether the process was likely to select a representative sample (0/5 yes)—the use of appropriate outcome measures (previously assessed; 0/5 yes), whether the methods were adequately described for replication (1/5 yes), and conflicts of interest (1/5 no, most did not report).</p>
        <p>The <italic>other</italic> studies performed best on the questions about whether the study design was appropriate for the aims and whether the conclusions were justified by the results (6/6 yes for both). They also did well, overall, on the appropriate choice of outcome variables and internal consistency (5/6 yes for both). However, all the <italic>other</italic> studies for which the questions were applicable performed poorly on questions about the justification of sample size (0/5 yes), whether the selection process was likely to get a representative sample (0/5 yes), addressing nonresponders (0/2 yes), adequate description of basic data (0/4 yes), concerns about nonresponse bias (0/3 no), the presentation of results for all the analyses described in the methods (0/6 yes, although this was mostly because analyses were not adequately described in the methods), and conflicts of interest (0/6 no, again because nothing was reported). Furthermore, only 1 study adequately addressed the questions about the use of previously assessed outcome measures (1/5 yes), sufficient description of the methods for replication (1/6 yes), and discussion of study limitations (1/6 yes). It should be noted that the AXIS tool used to assess the <italic>other</italic> studies was designed for cross-sectional studies and does not fit exactly with the designs of these studies. Therefore, it is possible that these studies would perform better when assessed by a tool specific to their study type. 
Tables depicting the judgments for each question of the CASP cohort and qualitative checklists and the AXIS tool for the cross-sectional and <italic>other</italic> studies are included in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendices 6</xref>-<xref ref-type="supplementary-material" rid="app9">9</xref> [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref38">38</xref>-<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref54">54</xref>-<xref ref-type="bibr" rid="ref56">56</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this systematic review, we examined 31 studies that evaluated the effectiveness and usability of conversational agents in health care. Overall, studies reported a moderate amount of evidence supporting the effectiveness, usability, and positive user perceptions of the agents. On average, two-thirds of the studies (67%) reported positive or mixed evidence for each evaluation outcome. However, this ranged significantly, with usability, agent performance, and satisfaction having the most support across the studies, and cost-effectiveness receiving hardly any support. It should also be noted that the definitions of <italic>effectiveness</italic> were highly varied and, as evidenced by the methodological limitations identified in the quality assessment, rarely evaluated with the scrutiny expected for medical devices. Although the results reported are promising for the use of conversational agents in health care, there are a number of limitations in both the studies analyzed and the structure of this review that question the validity of this finding.</p>
        <p>With regard to qualitative user perceptions of the agents, specific feedback was very mixed. Users highlighted many positive factors of the agents, particularly their personality and ability to provide empathy and emotional support, that they support learning, they are easy to use and access, and they help them be accountable, all of which support the generally positive evaluations of usability and satisfaction outcomes. However, there were a number of limitations of the agents that were consistently raised across the studies that reported qualitative feedback. These included the following: the agents had difficulty understanding them, the agents were repetitive and not sufficiently interactive, and the users had difficulty forming personal connections with the agents. This suggests that despite the generally positive usability reported by the studies, there are a number of barriers to the successful use of conversational agents in health care that will need to be addressed before they can achieve the greatest impact. It should be noted that this review only included studies of conversational agents that used NLP and that free-text inputs are likely to present greater difficulties for comprehension.</p>
        <p>The results of this systematic review are largely consistent with the literature, particularly the previous systematic review evaluating conversational agents in health care [<xref ref-type="bibr" rid="ref2">2</xref>]. They also found a limited quality of design and evidence in the included studies, with inconsistent reporting of study methods (including methods of selection, attrition, and a lack of validated outcome measures) and conflicts of interest [<xref ref-type="bibr" rid="ref2">2</xref>]. The previous systematic review identified that high-quality evidence of effectiveness and patient safety was limited, which was also observed in this review. Similarly, it noted that high overall satisfaction was generally reported by the studies, but that the most common issues with conversational agents related to language understanding or poor dialogue management, which is consistent with our findings [<xref ref-type="bibr" rid="ref2">2</xref>]. Some of this similarity in results is likely because of the overlap in included studies; 7 of their 17 included studies were also included in our review [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      </sec>
      <sec>
        <title>Quality of the Evidence</title>
        <p>As noted in a previous systematic review [<xref ref-type="bibr" rid="ref2">2</xref>], there were significant issues with the quality of many of the included studies. One of the consistent issues among many of them was a high risk of selection bias. A large proportion of the studies relied on volunteers for the study, many of whom were recruited via self-selection means such as flyers and emails or by downloading the app being studied. The risk with self-selection recruitment is that participants who elect to take part in the study are already more positively predisposed to new technologies than those who do not participate, and would tend to evaluate the technology more positively. To make matters worse, several of the studies also did not sufficiently report their recruitment strategies, and so their potential selection bias cannot be accurately evaluated. In research such as this, where user perceptions are a main outcome, this is a serious concern. Future studies should take care to implement recruitment strategies that minimize this risk of selection bias or balance the potential bias in evaluations by actively recruiting participants who are less inclined toward new technology.</p>
        <p>Another limitation of many of the studies was the small sample size. Almost two-thirds of the studies (19/31) used samples of fewer than 100 participants or items of analysis (eg, voice clips and clinical scenarios) with a median sample size of 48 across all the studies. Many also did not sufficiently report demographic data or whether their sample was representative of their target population. Although many of these studies were early feasibility and usability trials, this is an important issue to address in future research testing these agents to determine whether an agent will be used and used effectively by its target population.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The validity of the evidence extracted from the included studies was also affected by limitations in the structure of this review. The SF/HIT was used to provide a structured set of whole system implementation outcomes to evaluate the conversational agents [<xref ref-type="bibr" rid="ref31">31</xref>]. However, an issue with the use of this framework, which was discovered during analysis, was that many of the included studies were describing system innovation. Therefore, they did not address or provide evidence for many of the outcomes described by the SF/HIT. Additionally, as the included data indicated a self-reported impact in the studies of effectiveness, the study effectiveness is biased favorably toward the authors’ reporting of impact.</p>
        <p>This limitation in the use of the framework for this review also highlights a limitation in many of these studies, namely, that they do not think about whole system implementation from the early stages of agent design, development, and testing. It is possible that the lack of evaluation of the implications of the agents for health care provision and resources was because of an emphasis on technology development and evaluation, rather than system integration. This is a pervasive issue in technological innovation, so much so that it drove the development of the nonadoption, abandonment, scale-up, spread, and sustainability framework as a means of predicting and assessing the success of new health technologies [<xref ref-type="bibr" rid="ref58">58</xref>]. Such a framework should be applied to the development and evaluation of new conversational agents to ensure that these later-stage implications of health care provision, cost-effectiveness, and privacy and security are sufficiently considered from the early stages of innovation. They must also be properly evaluated with a large sample of users, rather than be simply presented as unsubstantiated claims that the agent will reduce costs and save health care providers’ time.</p>
        <p>Additionally, in accordance with the SF/HIT framework, the impact on each outcome was coded as <italic>positive or mixed</italic> or <italic>neutral or negative</italic>. However, this combination of positive and mixed outcomes reduces the granularity of the results. During the coding process, several outcomes were distinctly coded as <italic>positive or mixed</italic>, and collating the 2 outcome impacts into 1 reduces the precision of the information presented to the readers. Additionally, studies that did not assess the outcome in question were coded as <italic>neutral or negative</italic> because they did not provide explicit support for the outcome. In the analysis, outcomes were initially coded separately as positive, mixed, positive or mixed (for studies that reported a positive outcome but did not provide sufficient statistical evidence), and neutral or negative. This table is available in <xref ref-type="supplementary-material" rid="app10">Multimedia Appendix 10</xref>. Positive and mixed outcomes were combined for the final presentation of the data in line with the framework. However, it might be more useful to distinguish between studies that attempted to find significant evidence for an outcome but did not and those that did not attempt it. This would provide a clearer picture of which outcomes are not being supported by the evidence and should be targeted for improvement, and which outcomes still need to be examined. In the future, it would be worth evaluating whether the coding system should be adjusted to provide a more detailed and informative summary of the evidence.</p>
        <p>Further limitations of this review are that we limited the focus to include only unconstrained NLP and interaction. This was chosen as a focus because of the advantages NLP offers for simulating human-to-human interaction. However, it may have excluded studies of relevant conversational agents that could be satisfactory, useful, and effective in addressing current health care challenges. Additionally, no spidering searches were used to identify potentially relevant studies in the references of the included studies that were missed in the initial search. The exclusion of conference abstracts might also have caused relevant papers that were classified as abstracts to be missed; however, a previous systematic review that included conference abstracts in their search only had 1 included in their final selection [<xref ref-type="bibr" rid="ref2">2</xref>]. The inclusion of only studies published in English is also likely to exclude relevant research on conversational agents conducted in other countries. These limitations should be addressed in future studies to ensure that the full body of relevant literature is examined.</p>
      </sec>
      <sec>
        <title>Future Directions</title>
        <p>Future reviews of conversational agents in health care could be extended to include constrained NLP and non-NLP conversational agents. A synthesis of the evidence identified here with other types of conversational agents in health care, perhaps structured according to the taxonomy suggested by Montenegro et al [<xref ref-type="bibr" rid="ref5">5</xref>], could be used to examine overall trends and provide a better picture of what is being used, what works, and what does not, to further guide the development of conversational agents that are most likely to be successful.</p>
        <p>Future research should also include more qualitative evaluations of the features that users like and dislike. Only half (18/31) of the studies included in this review reported specific user feedback, despite the fact that 7 of the remaining 13 studies included some measure of usability or user perceptions. It will be important to identify all of the structural, physical, and psychological barriers to use if conversational agents are to achieve their potential for improving health care provision and reducing the strain on health care resources. To this end, it would be useful for future studies to structure their evaluation of conversational agents around a behavioral change framework (eg, the Behavior Change Wheel framework [<xref ref-type="bibr" rid="ref59">59</xref>]). This is important not only when evaluating the effectiveness of behavior change-focused conversational agents, but also when determining whether and how the adoption of new conversational agent technology will be successful.</p>
        <p>It will be important for future studies of conversational agents to take care to properly structure and report their studies to improve the quality of the evidence. Without high-quality evidence, it is difficult to assess the current state of conversational agents in health care—what is working, and what needs to be improved to make them a more useful tool. Similarly, there is a gap in the evidence regarding the health economics of these agents. Very few studies in this review even discussed the cost analysis of the agent in question, let alone provided substantive evidence about its cost-effectiveness. The evaluation of costs and outcomes of new technologies and their privacy, security, and interoperability will be necessary to advance value-based health care [<xref ref-type="bibr" rid="ref60">60</xref>]. However, there is very little evidence to suggest that the conversational agents examined in this review considered or addressed these concerns. User feedback on 2 of the studies even noted that better interoperability between the agent and EHRs or health care providers would improve its usefulness.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The objective of this systematic review was to synthesize evidence of conversational agents’ usability, effectiveness, and satisfaction in health care. Although the studies generally reported positive outcomes relating to the agents’ usability and effectiveness, the quality of the evidence was not sufficient to provide strong evidence to support these claims. This study extended the literature by expanding its summary to examine a whole system set of evaluation outcomes, including cost-effectiveness, privacy, and security, which have not been systematically examined in previous reviews. In addition, it provides a distinct contribution by conducting a thematic analysis of the qualitative user perceptions of the agents. Further research is needed to examine the cost-effectiveness and value of these agents in health care, both in their current and potential states. Higher-quality studies—with more consistent reporting of design methods and better sample selection—are also needed to more accurately assess the usefulness and identify the key areas of improvement for current conversational agents. A more holistic approach to the design, development, and evaluation of conversational agents will help drive innovation and improve their value in health care.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Search queries and number of results for each database.</p>
        <media xlink:href="jmir_v22i10e20346_app1.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>EndNote search details.</p>
        <media xlink:href="jmir_v22i10e20346_app2.docx" xlink:title="DOCX File , 12 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Summary of study characteristics.</p>
        <media xlink:href="jmir_v22i10e20346_app3.docx" xlink:title="DOCX File , 27 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Data extraction table.</p>
        <media xlink:href="jmir_v22i10e20346_app4.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 166 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Summary of the thematic analysis of qualitative user feedback.</p>
        <media xlink:href="jmir_v22i10e20346_app5.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 112 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Summary of the quality assessment and judgments of cohort studies using the CASP (Critical Appraisal Skills Programme) Cohort Study Checklist.</p>
        <media xlink:href="jmir_v22i10e20346_app6.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 17 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Summary of the quality assessment and judgments of qualitative studies using the CASP (Critical Appraisal Skills Programme) Qualitative Study Checklist.</p>
        <media xlink:href="jmir_v22i10e20346_app7.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 12 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Summary of the quality assessment and judgments of the cross-sectional studies using the AXIS (Appraisal tool for Cross-Sectional Studies) tool.</p>
        <media xlink:href="jmir_v22i10e20346_app8.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 14 KB"/>
      </supplementary-material>
      <supplementary-material id="app9">
        <label>Multimedia Appendix 9</label>
        <p>Summary of the quality assessment and judgments of the ‘other’ studies using the AXIS (Appraisal tool for Cross-Sectional Studies) tool.</p>
        <media xlink:href="jmir_v22i10e20346_app9.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 13 KB"/>
      </supplementary-material>
      <supplementary-material id="app10">
        <label>Multimedia Appendix 10</label>
        <p>Summary of the studies based on the evaluation outcomes from the synthesis framework for the assessment of health information technology differentiating between positive and mixed outcomes.</p>
        <media xlink:href="jmir_v22i10e20346_app10.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 82 KB"/>
      </supplementary-material>
      <supplementary-material id="app11">
        <label>Multimedia Appendix 11</label>
        <p>PRISMA (Preferred Reporting Items for Systematic Review and Meta-Analyses) checklist.</p>
        <media xlink:href="jmir_v22i10e20346_app11.doc" xlink:title="DOC File , 64 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AXIS</term>
          <def>
            <p>Appraisal tool for Cross-Sectional Studies</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CASP</term>
          <def>
            <p>Critical Appraisal Skills Programme</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ECA</term>
          <def>
            <p>embodied conversational agent</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ED</term>
          <def>
            <p>emergency department</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">IVR</term>
          <def>
            <p>interactive voice response</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">PRISMA</term>
          <def>
            <p>Preferred Reporting Items for Systematic Review and Meta-Analyses</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">RCT</term>
          <def>
            <p>randomized controlled trial</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">SF/HIT</term>
          <def>
            <p>synthesis framework for the assessment of health information technology</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to thank the outreach librarians Liz Callow (University of Oxford) and Kirsten Elliot (Imperial College London) for their assistance in developing search terms and reviewing search strategies. Specific funding for this work has not been acquired. EM’s work on digital health solutions is currently supported by the Sir David Cooksey Fellowship in Healthcare Translation at the University of Oxford. The conclusions drawn in this paper were made by the authors and are not necessarily supported by the University of Oxford. The funding body had no role in the design, execution, or analysis of this systematic review.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>CC and EM conceived the study topic and designed the review protocol. CC and MMI screened the studies. CC conducted the data extraction, which was validated by MMI, and MMI conducted the risk-of-bias and quality assessments, which were validated by EM. MMI and EM analyzed the extracted data. The methods section was drafted by CC, and the rest of the review was written by MMI with revisions from EM. MHS, EL, NP, EN and GM provided feedback on the final drafted text. EM supervised the study execution. The authors confirm that they have followed all the appropriate research reporting guidelines. The PRISMA checklist for systematic reviews has been uploaded as <xref ref-type="supplementary-material" rid="app11">Multimedia Appendix 11</xref> along with other relevant materials.</p>
      </fn>
      <fn fn-type="conflict">
        <p>EL, NP, and GM are all employees of Ufonia Limited, a voice AI company. However, the paper was funded by the Sir David Cooksey Fellowship in Healthcare Translation at the University of Oxford, and Ufonia had no editorial influence on the final drafting. Their contribution was limited to feedback, given their applied voice AI expertise; therefore, no conflict of interest is identified.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bibault</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chaix</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Nectoux</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pienkowsky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Guillemasse</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brouard</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Healthcare ex Machina: are conversational agents ready for prime time in oncology?</article-title>
          <source>Clin Transl Radiat Oncol</source>
          <year>2019</year>
          <month>05</month>
          <volume>16</volume>
          <fpage>55</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2405-6308(19)30015-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ctro.2019.04.002</pub-id>
          <pub-id pub-id-type="medline">31008379</pub-id>
          <pub-id pub-id-type="pii">S2405-6308(19)30015-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6454131</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laranjo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dunn</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Kocaballi</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bashir</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Surian</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gallego</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Magrabi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Coiera</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Conversational agents in healthcare: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <month>09</month>
          <day>1</day>
          <volume>25</volume>
          <issue>9</issue>
          <fpage>1248</fpage>
          <lpage>58</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30010941"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy072</pub-id>
          <pub-id pub-id-type="medline">30010941</pub-id>
          <pub-id pub-id-type="pii">5052181</pub-id>
          <pub-id pub-id-type="pmcid">PMC6118869</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luxton</surname>
              <given-names>DD</given-names>
            </name>
          </person-group>
          <article-title>Ethical implications of conversational agents in global public health</article-title>
          <source>Bull World Health Organ</source>
          <year>2020</year>
          <month>04</month>
          <day>1</day>
          <volume>98</volume>
          <issue>4</issue>
          <fpage>285</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32284654"/>
          </comment>
          <pub-id pub-id-type="doi">10.2471/BLT.19.237636</pub-id>
          <pub-id pub-id-type="medline">32284654</pub-id>
          <pub-id pub-id-type="pii">BLT.19.237636</pub-id>
          <pub-id pub-id-type="pmcid">PMC7133471</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davenport</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kalakota</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The potential for artificial intelligence in healthcare</article-title>
          <source>Future Healthc J</source>
          <year>2019</year>
          <month>06</month>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>94</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31363513"/>
          </comment>
          <pub-id pub-id-type="doi">10.7861/futurehosp.6-2-94</pub-id>
          <pub-id pub-id-type="medline">31363513</pub-id>
          <pub-id pub-id-type="pii">futurehealth</pub-id>
          <pub-id pub-id-type="pmcid">PMC6616181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Montenegro</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>da Costa</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>da Rosa Righi</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Survey of conversational agents in health</article-title>
          <source>Expert Syst Appl</source>
          <year>2019</year>
          <month>09</month>
          <volume>129</volume>
          <fpage>56</fpage>
          <lpage>67</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://paperpile.com/b/dTKa6R/lJJR"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.eswa.2019.03.054</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weizenbaum</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>ELIZA — a computer program for the study of natural language communication between man and machine</article-title>
          <source>Commun ACM</source>
          <year>1983</year>
          <month>01</month>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>23</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://paperpile.com/b/dTKa6R/6mwV"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/357980.357991</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Campillos-Llanos</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bilinski</surname>
              <given-names>É</given-names>
            </name>
            <name name-style="western">
              <surname>Zweigenbaum</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rosset</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Designing a virtual patient dialogue system based on terminology-rich resources: challenges and evaluation</article-title>
          <source>Nat Lang Eng</source>
          <year>2019</year>
          <month>07</month>
          <day>15</day>
          <fpage>1</fpage>
          <lpage>38</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://paperpile.com/b/dTKa6R/RdsW"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/s1351324919000329</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Developing a wireless speech- and touch-based intelligent comprehensive triage support system</article-title>
          <source>Comput Inform Nurs</source>
          <year>2008</year>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1097/01.NCN.0000304754.49116.b4</pub-id>
          <pub-id pub-id-type="medline">18091619</pub-id>
          <pub-id pub-id-type="pii">00024665-200801000-00009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Bacic</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Shanahan</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Paasche-Orlow</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Automated conversation system before pediatric primary care visits: a randomized trial</article-title>
          <source>Pediatrics</source>
          <year>2014</year>
          <month>09</month>
          <volume>134</volume>
          <issue>3</issue>
          <fpage>e691</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1542/peds.2013-3759</pub-id>
          <pub-id pub-id-type="medline">25092938</pub-id>
          <pub-id pub-id-type="pii">peds.2013-3759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kocaballi</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Berkovsky</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Quiroz</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Laranjo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Rezazadegan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Briatore</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Coiera</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The personalization of conversational agents in health care: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>11</month>
          <day>7</day>
          <volume>21</volume>
          <issue>11</issue>
          <fpage>e15360</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/11/e15360/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/15360</pub-id>
          <pub-id pub-id-type="medline">31697237</pub-id>
          <pub-id pub-id-type="pii">v21i11e15360</pub-id>
          <pub-id pub-id-type="pmcid">PMC6873147</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aldunate</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ratnam</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Morrow</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sosnoff</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Validity and usability of an automated fall risk assessment tool for older adults internet</article-title>
          <source>Innov Aging</source>
          <year>2018</year>
          <fpage>362</fpage>
          <pub-id pub-id-type="doi">10.1093/geroni/igy023.1338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nakagawa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Enomoto</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yonekura</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kanazawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kuniyoshi</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A Telecare System that Estimates Quality of Life through Communication</article-title>
          <source>International Conference on Cloud Computing and Intelligence Systems</source>
          <year>2018</year>
          <conf-name>CCIS'18</conf-name>
          <conf-date>November 23-25, 2018</conf-date>
          <conf-loc>Nanjing, China</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ccis.2018.8691360</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fitzpatrick</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Darcy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vierhile</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Delivering cognitive behavior therapy to young adults with symptoms of depression and anxiety using a fully automated conversational agent (WOEBOT): a randomized controlled trial</article-title>
          <source>JMIR Ment Health</source>
          <year>2017</year>
          <month>06</month>
          <day>6</day>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>e19</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2017/2/e19/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.7785</pub-id>
          <pub-id pub-id-type="medline">28588005</pub-id>
          <pub-id pub-id-type="pii">v4i2e19</pub-id>
          <pub-id pub-id-type="pmcid">PMC5478797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Håvik</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wake</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Flobak</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lundervold</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Guribye</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>A conversational interface for self-screening for ADHD in adults</article-title>
          <source>Internet Sci</source>
          <year>2019</year>
          <fpage>144</fpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-17705-8_12</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Isaza-Restrepo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gómez</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Cifuentes</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Argüello</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The virtual patient as a learning tool: a mixed quantitative qualitative study</article-title>
          <source>BMC Med Educ</source>
          <year>2018</year>
          <month>12</month>
          <day>6</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>297</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmededuc.biomedcentral.com/articles/10.1186/s12909-018-1395-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12909-018-1395-8</pub-id>
          <pub-id pub-id-type="medline">30522478</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12909-018-1395-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6282259</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Heerden</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ntinga</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Vilakazi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The Potential of Conversational Agents to Provide a Rapid HIV Counseling and Testing Services</article-title>
          <source>International Conference on the Frontiers and Advances in Data Science</source>
          <year>2017</year>
          <conf-name>FADS'17</conf-name>
          <conf-date>October 23-25, 2017</conf-date>
          <conf-loc>Xi'an, China</conf-loc>
          <pub-id pub-id-type="doi">10.1109/fads.2017.8253198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeifer</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Byron</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Forsythe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Henault</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Jack</surname>
              <given-names>BW</given-names>
            </name>
            <name name-style="western">
              <surname>Silliman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Paasche-Orlow</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Usability of conversational agents by patients with inadequate health literacy: evidence from two clinical trials</article-title>
          <source>J Health Commun</source>
          <year>2010</year>
          <volume>15</volume>
          <issue>Suppl 2</issue>
          <fpage>197</fpage>
          <lpage>210</lpage>
          <pub-id pub-id-type="doi">10.1080/10810730.2010.499991</pub-id>
          <pub-id pub-id-type="medline">20845204</pub-id>
          <pub-id pub-id-type="pii">926954323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bickmore</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Medical Shared Decision Making with a Virtual Agent</article-title>
          <source>Proceedings of the 18th International Conference on Intelligent Virtual Agents</source>
          <year>2018</year>
          <conf-name>IVA'18</conf-name>
          <conf-date>November 5-8, 2018</conf-date>
          <conf-loc>Sydney, NSW, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3267851.3267883</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaidyam</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Wisniewski</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Halamka</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Kashavan</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Chatbots and conversational agents in mental health: a review of the psychiatric landscape</article-title>
          <source>Can J Psychiatry</source>
          <year>2019</year>
          <month>07</month>
          <volume>64</volume>
          <issue>7</issue>
          <fpage>456</fpage>
          <lpage>64</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30897957"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/0706743719828977</pub-id>
          <pub-id pub-id-type="medline">30897957</pub-id>
          <pub-id pub-id-type="pmcid">PMC6610568</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>D'Onofrio</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gangemi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Giuliani</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mongiovi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ricciardi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Greco</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Cavallo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dario</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sancarlo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Presutti</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Greco</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Dialogue systems and conversational agents for patients with dementia: the human-robot interaction</article-title>
          <source>Rejuvenation Res</source>
          <year>2019</year>
          <month>04</month>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>109</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1089/rej.2018.2075</pub-id>
          <pub-id pub-id-type="medline">30033861</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xing</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Qanir</surname>
              <given-names>YA</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Intelligent conversational agents in patient self-management: a systematic survey using multi data sources</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <month>08</month>
          <day>21</day>
          <volume>264</volume>
          <fpage>1813</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI190661</pub-id>
          <pub-id pub-id-type="medline">31438357</pub-id>
          <pub-id pub-id-type="pii">SHTI190661</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Provoost</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Ruwaard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Riper</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Embodied conversational agents in clinical psychology: a scoping review</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>05</month>
          <day>9</day>
          <volume>19</volume>
          <issue>5</issue>
          <fpage>e151</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/5/e151/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.6553</pub-id>
          <pub-id pub-id-type="medline">28487267</pub-id>
          <pub-id pub-id-type="pii">v19i5e151</pub-id>
          <pub-id pub-id-type="pmcid">PMC5442350</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Safi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thiessen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schmailzl</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>Acceptance and resistance of new digital technologies in medicine: qualitative study</article-title>
          <source>JMIR Res Protoc</source>
          <year>2018</year>
          <month>12</month>
          <day>4</day>
          <volume>7</volume>
          <issue>12</issue>
          <fpage>e11072</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2018/12/e11072/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11072</pub-id>
          <pub-id pub-id-type="medline">30514693</pub-id>
          <pub-id pub-id-type="pii">v7i12e11072</pub-id>
          <pub-id pub-id-type="pmcid">PMC6299231</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Cock</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Milne-Ives</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van Velthoven</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Alturkistani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Meinert</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Effectiveness of conversational agents (virtual assistants) in health care: protocol for a systematic review</article-title>
          <source>JMIR Res Protoc</source>
          <year>2020</year>
          <month>03</month>
          <day>9</day>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>e16934</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2020/3/e16934/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/16934</pub-id>
          <pub-id pub-id-type="medline">32149717</pub-id>
          <pub-id pub-id-type="pii">v9i3e16934</pub-id>
          <pub-id pub-id-type="pmcid">PMC7091022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schardt</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Owens</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Keitz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fontelo</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Utilization of the PICO framework to improve searching PubMed for clinical questions</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2007</year>
          <month>06</month>
          <day>15</day>
          <volume>7</volume>
          <fpage>16</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/1472-6947-7-16"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1472-6947-7-16</pub-id>
          <pub-id pub-id-type="medline">17573961</pub-id>
          <pub-id pub-id-type="pii">1472-6947-7-16</pub-id>
          <pub-id pub-id-type="pmcid">PMC1904193</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shamseer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghersi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liberati</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Petticrew</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shekelle</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>LA</given-names>
            </name>
            <collab>PRISMA-P Group</collab>
          </person-group>
          <article-title>Preferred reporting items for systematic review and meta-analysis protocols (PRISMA-P) 2015: elaboration and explanation</article-title>
          <source>Br Med J</source>
          <year>2015</year>
          <month>01</month>
          <day>2</day>
          <volume>350</volume>
          <fpage>g7647</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/cgi/pmidlookup?view=long&#38;pmid=25555855"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.g7647</pub-id>
          <pub-id pub-id-type="medline">25555855</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Higgins</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Cochrane Handbook for Systematic Reviews of Interventions</source>
          <year>2019</year>
          <comment>ISBN 9781119536628</comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Higgins</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Gøtzsche</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Jüni</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oxman</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Savovic</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schulz</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Weeks</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sterne</surname>
              <given-names>JAC</given-names>
            </name>
            <collab>Cochrane Bias Methods Group</collab>
            <collab>Cochrane Statistical Methods Group</collab>
          </person-group>
          <article-title>The cochrane collaboration's tool for assessing risk of bias in randomised trials</article-title>
          <source>Br Med J</source>
          <year>2011</year>
          <month>10</month>
          <day>18</day>
          <volume>343</volume>
          <fpage>d5928</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22008217"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.d5928</pub-id>
          <pub-id pub-id-type="medline">22008217</pub-id>
          <pub-id pub-id-type="pmcid">PMC3196245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <article-title>CASP Checklists</article-title>
          <source>Critical Appraisal Skills Programme: CASP</source>
          <access-date>2020-09-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://casp-uk.net/casp-tools-checklists/">https://casp-uk.net/casp-tools-checklists/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Downes</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>RS</given-names>
            </name>
          </person-group>
          <article-title>Development of a critical appraisal tool to assess the quality of cross-sectional studies (AXIS)</article-title>
          <source>BMJ Open</source>
          <year>2016</year>
          <month>12</month>
          <day>8</day>
          <volume>6</volume>
          <issue>12</issue>
          <fpage>e011458</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://bmjopen.bmj.com/cgi/pmidlookup?view=long&#38;pmid=27932337"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2016-011458</pub-id>
          <pub-id pub-id-type="medline">27932337</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2016-011458</pub-id>
          <pub-id pub-id-type="pmcid">PMC5168618</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Christopoulou</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Kotsilieris</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Anagnostopoulos</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Assessment of health information technology interventions in evidence-based medicine: a systematic review by adopting a methodological evaluation framework</article-title>
          <source>Healthcare (Basel)</source>
          <year>2018</year>
          <month>08</month>
          <day>31</day>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>109</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare6030109"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare6030109</pub-id>
          <pub-id pub-id-type="medline">30200307</pub-id>
          <pub-id pub-id-type="pii">healthcare6030109</pub-id>
          <pub-id pub-id-type="pmcid">PMC6165327</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cameron</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cameron</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Megaw</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bond</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mulvenna</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>O'Neill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Armour</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>McTear</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Assessing the Usability of a Chatbot for Mental Health Care</source>
          <year>2019</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <comment>In: Bodrunova S, editor. Internet Science. Lecture Notes in Computer Science, vol 11551</comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elmasri</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Maeder</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A Conversational Agent for an Online Mental Health Intervention</article-title>
          <source>Brain Informatics and Health</source>
          <year>2016</year>
          <fpage>251</fpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-47103-7_24</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fulmer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Joerin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gentile</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lakerink</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rauws</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Using psychological artificial intelligence (Tess) to relieve symptoms of depression and anxiety: randomized controlled trial</article-title>
          <source>JMIR Ment Health</source>
          <year>2018</year>
          <month>12</month>
          <day>13</day>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>e64</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2018/4/e64/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.9782</pub-id>
          <pub-id pub-id-type="medline">30545815</pub-id>
          <pub-id pub-id-type="pii">v5i4e64</pub-id>
          <pub-id pub-id-type="pmcid">PMC6315222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hudlicka</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Virtual training and coaching of health behavior: example from mindfulness meditation training</article-title>
          <source>Patient Educ Couns</source>
          <year>2013</year>
          <month>08</month>
          <volume>92</volume>
          <issue>2</issue>
          <fpage>160</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23809167"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2013.05.007</pub-id>
          <pub-id pub-id-type="medline">23809167</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(13)00207-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC3970714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Inkster</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sarda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Subramanian</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>An empathy-driven, conversational artificial intelligence agent (Wysa) for digital mental well-being: real-world data evaluation mixed-methods study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2018</year>
          <month>11</month>
          <day>23</day>
          <volume>6</volume>
          <issue>11</issue>
          <fpage>e12106</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2018/11/e12106/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12106</pub-id>
          <pub-id pub-id-type="medline">30470676</pub-id>
          <pub-id pub-id-type="pii">v6i11e12106</pub-id>
          <pub-id pub-id-type="pmcid">PMC6286427</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ly</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Ly</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Andersson</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A fully automated conversational agent for promoting mental well-being: a pilot RCT using mixed methods</article-title>
          <source>Internet Interv</source>
          <year>2017</year>
          <month>12</month>
          <volume>10</volume>
          <fpage>39</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-7829(17)30091-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.invent.2017.10.002</pub-id>
          <pub-id pub-id-type="medline">30135751</pub-id>
          <pub-id pub-id-type="pii">S2214-7829(17)30091-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC6084875</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Philip</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Micoulaud-Franchi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sagaspe</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sevin</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Olive</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bioulac</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sauteraud</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Virtual human as a new diagnostic tool, a proof of concept study in the field of major depressive disorders</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>02</month>
          <day>16</day>
          <volume>7</volume>
          <fpage>42656</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/srep42656"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep42656</pub-id>
          <pub-id pub-id-type="medline">28205601</pub-id>
          <pub-id pub-id-type="pii">srep42656</pub-id>
          <pub-id pub-id-type="pmcid">PMC5311989</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yasavur</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Lisetti</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rishe</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Let’s talk! speaking virtual counselor offers you a brief intervention</article-title>
          <source>J Multimodal User Interfaces</source>
          <year>2014</year>
          <month>09</month>
          <day>5</day>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>381</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1007/s12193-014-0169-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Judkins</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cannizzaro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A voice-based automated system for PTSD screening and monitoring</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2012</year>
          <volume>173</volume>
          <fpage>552</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="medline">22357057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Washburn</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bordnick</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rizzo</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>A pilot feasibility study of virtual patient simulation to enhance social work students' brief mental health assessment skills</article-title>
          <source>Soc Work Health Care</source>
          <year>2016</year>
          <month>10</month>
          <volume>55</volume>
          <issue>9</issue>
          <fpage>675</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1080/00981389.2016.1210715</pub-id>
          <pub-id pub-id-type="medline">27552646</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dimeff</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Jobes</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Chalker</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Piehl</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Duvivier</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Lok</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Zalake</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koerner</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A novel engagement of suicidality in the emergency department: virtual collaborative assessment and management of suicidality</article-title>
          <source>Gen Hosp Psychiatry</source>
          <year>2020</year>
          <volume>63</volume>
          <fpage>119</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1016/j.genhosppsych.2018.05.005</pub-id>
          <pub-id pub-id-type="medline">29934033</pub-id>
          <pub-id pub-id-type="pii">S0163-8343(18)30088-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spänig</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Emberger-Klein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sowa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Canbay</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Menrad</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Heider</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The virtual doctor: an interactive clinical-decision-support system based on deep learning for non-invasive prediction of diabetes</article-title>
          <source>Artif Intell Med</source>
          <year>2019</year>
          <month>09</month>
          <volume>100</volume>
          <fpage>101706</fpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2019.101706</pub-id>
          <pub-id pub-id-type="medline">31607340</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(19)30108-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatia</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Quro: facilitating user symptom check using a personalised chatbot-oriented dialogue system</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2018</year>
          <volume>252</volume>
          <fpage>51</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="medline">30040682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chaix</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bibault</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pienkowski</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Delamon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Guillemassé</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nectoux</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Brouard</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>When chatbots meet patients: one-year prospective study of conversations between patients with breast cancer and a chatbot</article-title>
          <source>JMIR Cancer</source>
          <year>2019</year>
          <month>05</month>
          <day>2</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e12856</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cancer.jmir.org/2019/1/e12856/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12856</pub-id>
          <pub-id pub-id-type="medline">31045505</pub-id>
          <pub-id pub-id-type="pii">v5i1e12856</pub-id>
          <pub-id pub-id-type="pmcid">PMC6521209</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bibault</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chaix</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Guillemassé</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cousin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Escande</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Perrin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pienkowski</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Delamon</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nectoux</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Brouard</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>A chatbot versus physicians to provide information for patients with breast cancer: blind, randomized controlled noninferiority trial</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>11</month>
          <day>27</day>
          <volume>21</volume>
          <issue>11</issue>
          <fpage>e15787</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/11/e15787/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/15787</pub-id>
          <pub-id pub-id-type="medline">31774408</pub-id>
          <pub-id pub-id-type="pii">v21i11e15787</pub-id>
          <pub-id pub-id-type="pmcid">PMC6906616</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heyworth</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kleinman</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Oddleifson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Frampton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lehrer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Salvato</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Connelly</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Comparison of interactive voice response, patient mailing, and mailed registry to encourage screening for osteoporosis: a randomized controlled trial</article-title>
          <source>Osteoporos Int</source>
          <year>2014</year>
          <month>05</month>
          <volume>25</volume>
          <issue>5</issue>
          <fpage>1519</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1007/s00198-014-2629-1</pub-id>
          <pub-id pub-id-type="medline">24566584</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rhee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mammen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Swift</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Mobile phone-based asthma self-management aid for adolescents (mASMAA): a feasibility study</article-title>
          <source>Patient Prefer Adherence</source>
          <year>2014</year>
          <volume>8</volume>
          <fpage>63</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.2147/PPA.S53504"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/PPA.S53504</pub-id>
          <pub-id pub-id-type="medline">24470755</pub-id>
          <pub-id pub-id-type="pii">ppa-8-063</pub-id>
          <pub-id pub-id-type="pmcid">PMC3891581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Soumerai</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Ensroth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fletcher</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Ross-Degnan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Failure of automated telephone outreach with speech recognition to improve colorectal cancer screening: a randomized controlled trial</article-title>
          <source>Arch Intern Med</source>
          <year>2010</year>
          <month>02</month>
          <day>8</day>
          <volume>170</volume>
          <issue>3</issue>
          <fpage>264</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.1001/archinternmed.2009.522</pub-id>
          <pub-id pub-id-type="medline">20142572</pub-id>
          <pub-id pub-id-type="pii">170/3/264</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Borja-Hart</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Spivey</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Use of virtual patient software to assess student confidence and ability in communication skills and virtual patient impression: a mixed-methods approach</article-title>
          <source>Curr Pharm Teach Learn</source>
          <year>2019</year>
          <month>07</month>
          <volume>11</volume>
          <issue>7</issue>
          <fpage>710</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cptl.2019.03.009</pub-id>
          <pub-id pub-id-type="medline">31227094</pub-id>
          <pub-id pub-id-type="pii">S1877-1297(18)30168-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Philip</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bioulac</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sauteraud</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaufton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Olive</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Could a virtual human be used to explore excessive daytime sleepiness in patients?</article-title>
          <source>Presence</source>
          <year>2014</year>
          <month>11</month>
          <day>1</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>369</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1162/pres_a_00197</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Galescu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Quinn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Swift</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Speech Recognition in a Dialog System for Patient Health Monitoring</article-title>
          <source>International Conference on Bioinformatics and Biomedicine Workshop</source>
          <year>2009</year>
          <conf-name>BIBMW'09</conf-name>
          <conf-date>November 1-4, 2009</conf-date>
          <conf-loc>Washington, DC</conf-loc>
          <pub-id pub-id-type="doi">10.1109/bibmw.2009.5332111</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friederichs</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bolman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Oenema</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Guyaux</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lechner</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Motivational interviewing in a web-based physical activity intervention with an avatar: randomized controlled trial</article-title>
          <source>J Med Internet Res</source>
          <year>2014</year>
          <month>02</month>
          <day>13</day>
          <volume>16</volume>
          <issue>2</issue>
          <fpage>e48</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2014/2/e48/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.2974</pub-id>
          <pub-id pub-id-type="medline">24550153</pub-id>
          <pub-id pub-id-type="pii">v16i2e48</pub-id>
          <pub-id pub-id-type="pmcid">PMC3936285</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crutzen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>GY</given-names>
            </name>
            <name name-style="western">
              <surname>Portugal</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Fisser</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Grolleman</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>An artificially intelligent chat agent that answers adolescents' questions related to sex, drugs, and alcohol: an exploratory study</article-title>
          <source>J Adolesc Health</source>
          <year>2011</year>
          <month>05</month>
          <volume>48</volume>
          <issue>5</issue>
          <fpage>514</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jadohealth.2010.09.002</pub-id>
          <pub-id pub-id-type="medline">21501812</pub-id>
          <pub-id pub-id-type="pii">S1054-139X(10)00430-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Thangarajah</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Padgham</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Contextual question answering for the health domain</article-title>
          <source>J Am Soc Inf Sci Technol</source>
          <year>2012</year>
          <month>10</month>
          <day>30</day>
          <volume>63</volume>
          <issue>11</issue>
          <fpage>2313</fpage>
          <lpage>27</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/asi.22733"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/asi.22733</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ireland</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Atay</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liddle</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bradford</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rushin</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Mullins</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Angus</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wiles</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McBride</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vogel</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Hello Harlie: enabling speech monitoring through chat-bot conversations</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2016</year>
          <volume>227</volume>
          <fpage>55</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="medline">27440289</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="web">
          <source>RevMan</source>
          <access-date>2020-09-11</access-date>
          <publisher-loc>Copenhagen</publisher-loc>
          <publisher-name>The Nordic Cochrane Centre</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://community.cochrane.org/help/tools-and-software/revman-5">https://community.cochrane.org/help/tools-and-software/revman-5</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greenhalgh</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wherton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Papoutsi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>A'Court</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hinder</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fahy</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Procter</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Beyond adoption: a new framework for theorizing and evaluating nonadoption, abandonment, and challenges to the scale-up, spread, and sustainability of health and care technologies</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>11</month>
          <day>1</day>
          <volume>19</volume>
          <issue>11</issue>
          <fpage>e367</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/11/e367/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.8775</pub-id>
          <pub-id pub-id-type="medline">29092808</pub-id>
          <pub-id pub-id-type="pii">v19i11e367</pub-id>
          <pub-id pub-id-type="pmcid">PMC5688245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Michie</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>van Stralen</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>West</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The behaviour change wheel: a new method for characterising and designing behaviour change interventions</article-title>
          <source>Implement Sci</source>
          <year>2011</year>
          <month>04</month>
          <day>23</day>
          <volume>6</volume>
          <fpage>42</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://implementationscience.biomedcentral.com/articles/10.1186/1748-5908-6-42"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1748-5908-6-42</pub-id>
          <pub-id pub-id-type="medline">21513547</pub-id>
          <pub-id pub-id-type="pii">1748-5908-6-42</pub-id>
          <pub-id pub-id-type="pmcid">PMC3096582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meinert</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Alturkistani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brindley</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Knight</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wells</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pennington</surname>
              <given-names>ND</given-names>
            </name>
          </person-group>
          <article-title>The technological imperative for value-based health care</article-title>
          <source>Br J Hosp Med (Lond)</source>
          <year>2018</year>
          <month>06</month>
          <day>2</day>
          <volume>79</volume>
          <issue>6</issue>
          <fpage>328</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.12968/hmed.2018.79.6.328</pub-id>
          <pub-id pub-id-type="medline">29894248</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
