<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="review-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e52597</article-id>
      <article-id pub-id-type="pmid">39661968</article-id>
      <article-id pub-id-type="doi">10.2196/52597</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Large Language Models and Empathy: Systematic Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Long</surname>
            <given-names>Xiao</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pandey</surname>
            <given-names>Sachin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ilicki</surname>
            <given-names>Jonathan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Tabaie</surname>
            <given-names>Azade</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Sorin</surname>
            <given-names>Vera</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Radiology</institution>
            <institution>Mayo Clinic</institution>
            <addr-line>200 First Street SW</addr-line>
            <addr-line>Rochester, MN, 55905</addr-line>
            <country>United States</country>
            <phone>1 5072842511</phone>
            <email>verasrn@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0509-4686</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Brin</surname>
            <given-names>Dana</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-7316-206X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Barash</surname>
            <given-names>Yiftach</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7242-1328</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Konen</surname>
            <given-names>Eli</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9507-2450</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Charney</surname>
            <given-names>Alexander</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8135-6858</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Nadkarni</surname>
            <given-names>Girish</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6319-4314</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Klang</surname>
            <given-names>Eyal</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4567-3108</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Radiology</institution>
        <institution>Mayo Clinic</institution>
        <addr-line>Rochester, MN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Diagnostic Imaging</institution>
        <institution>Sheba Medical Center</institution>
        <addr-line>Ramat Gan</addr-line>
        <country>Israel</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>The Faculty of Medicine</institution>
        <institution>Tel Aviv University</institution>
        <addr-line>Tel Aviv</addr-line>
        <country>Israel</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>DeepVision Lab</institution>
        <institution>Chaim Sheba Medical Center</institution>
        <addr-line>Tel Hashomer</addr-line>
        <country>Israel</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Division of Data-Driven and Digital Medicine</institution>
        <institution>Icahn School of Medicine at Mount Sinai</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>The Charles Bronfman Institute of Personalized Medicine</institution>
        <institution>Icahn School of Medicine at Mount Sinai</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Vera Sorin <email>verasrn@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>11</day>
        <month>12</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e52597</elocation-id>
      <history>
        <date date-type="received">
          <day>9</day>
          <month>9</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>1</day>
          <month>2</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>27</day>
          <month>2</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>20</day>
          <month>10</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Vera Sorin, Dana Brin, Yiftach Barash, Eli Konen, Alexander Charney, Girish Nadkarni, Eyal Klang. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 11.12.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e52597" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Empathy, a fundamental aspect of human interaction, is characterized as the ability to experience another being’s emotions within oneself. In health care, empathy is a fundamental for health care professionals and patients’ interaction. It is a unique quality to humans that large language models (LLMs) are believed to lack.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to review the literature on the capacity of LLMs in demonstrating empathy.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We conducted a literature search on MEDLINE, Google Scholar, PsyArXiv, medRxiv, and arXiv between December 2022 and February 2024. We included English-language full-length publications that evaluated empathy in LLMs’ outputs. We excluded papers evaluating other topics related to emotional intelligence that were not specifically empathy. The included studies’ results, including the LLMs used, performance in empathy tasks, and limitations of the models, along with studies’ metadata were summarized.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A total of 12 studies published in 2023 met the inclusion criteria. ChatGPT-3.5 (OpenAI) was evaluated in all studies, with 6 studies comparing it with other LLMs such GPT-4, LLaMA (Meta), and fine-tuned chatbots. Seven studies focused on empathy within a medical context. The studies reported LLMs to exhibit elements of empathy, including emotions recognition and emotional support in diverse contexts. Evaluation metric included automatic metrics such as Recall-Oriented Understudy for Gisting Evaluation and Bilingual Evaluation Understudy, and human subjective evaluation. Some studies compared performance on empathy with humans, while others compared between different models. In some cases, LLMs were observed to outperform humans in empathy-related tasks. For example, ChatGPT-3.5 was evaluated for its responses to patients’ questions from social media, where ChatGPT’s responses were preferred over those of humans in 78.6% of cases. Other studies used subjective readers’ assigned scores. One study reported a mean empathy score of 1.84-1.9 (scale 0-2) for their fine-tuned LLM, while a different study evaluating ChatGPT-based chatbots reported a mean human rating of 3.43 out of 4 for empathetic responses. Other evaluations were based on the level of the emotional awareness scale, which was reported to be higher for ChatGPT-3.5 than for humans. Another study evaluated ChatGPT and GPT-4 on soft-skills questions in the United States Medical Licensing Examination, where GPT-4 answered 90% of questions correctly. Limitations were noted, including repetitive use of empathic phrases, difficulty following initial instructions, overly lengthy responses, sensitivity to prompts, and overall subjective evaluation metrics influenced by the evaluator’s background.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>LLMs exhibit elements of cognitive empathy, recognizing emotions and providing emotionally supportive responses in various contexts. Since social skills are an integral part of intelligence, these advancements bring LLMs closer to human-like interactions and expand their potential use in applications requiring emotional intelligence. However, there remains room for improvement in both the performance of these models and the evaluation strategies used for assessing soft skills.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>empathy</kwd>
        <kwd>LLMs</kwd>
        <kwd>AI</kwd>
        <kwd>ChatGPT</kwd>
        <kwd>review methods</kwd>
        <kwd>review methodology</kwd>
        <kwd>systematic review</kwd>
        <kwd>scoping</kwd>
        <kwd>synthesis</kwd>
        <kwd>foundation models</kwd>
        <kwd>text-based</kwd>
        <kwd>human interaction</kwd>
        <kwd>emotional intelligence</kwd>
        <kwd>objective metrics</kwd>
        <kwd>human assessment</kwd>
        <kwd>emotions</kwd>
        <kwd>healthcare</kwd>
        <kwd>cognitive</kwd>
        <kwd>PRISMA</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Empathy, a fundamental aspect of human interaction, can be characterized as the ability to experience the emotions of another being within oneself. The origin of the word “empathy” dates back to the 1880s, when Theodore Lipps determined the word “einfuhlung” (“in-feeling”) to describe the emotional appreciation of another’s feelings [<xref ref-type="bibr" rid="ref1">1</xref>]. Empathy involves recognition of others’ feelings, the causes of these feelings, and the ability to participate in an emotional experience of an individual without becoming part of it [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
      <p>Empathy is described as “the ability to see the world through someone else’s eyes,” having the ability to imagine what someone else is thinking and feeling in a given situation [<xref ref-type="bibr" rid="ref2">2</xref>]. It is commonly understood to encompass cognitive and affective components: the ability to understand another’s feelings (cognitive empathy) and to experience emotions in response to others (affective empathy) [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>In health care, empathy has an important role in patient care, improving patient satisfaction and treatment adherence. Empathy allows health care professionals to understand the emotional and psychological states of patients, fostering better communication and trust [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
      <p>Large language models (LLMs) have demonstrated remarkable capabilities across various tasks, including text summarization, question-answering, and text generation [<xref ref-type="bibr" rid="ref5">5</xref>]. There are numerous studies on potential applications in health care, as an educational tool and as a support tool in clinical work [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. These models are already being integrated into practice. For instance, Epic has integrated GPT4 in its electronic health record software [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>While LLMs have the potential to improve and automate some medical tasks, there are significant limitations to these models and their integration [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Despite the promising natural language processing capabilities, these models make errors and their performance in clinical tasks is challenging to evaluate on a large scale [<xref ref-type="bibr" rid="ref12">12</xref>]. Many studies thus rely on multiple-choice questions assessment, which do not reflect real-world clinical applications [<xref ref-type="bibr" rid="ref13">13</xref>]. These models can introduce bias [<xref ref-type="bibr" rid="ref14">14</xref>], and can be susceptible to cyberattacks [<xref ref-type="bibr" rid="ref15">15</xref>]. Some studies that evaluated these models for medical tasks suggested that despite impressive capabilities, LLMs lack empathy, a quality that is unique to humans and is imperative in health care [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>Recent studies discuss and evaluate LLMs performance in tasks related to emotional intelligence, theory of mind, and empathy [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. Some evidence suggests that these models may show aspects of cognitive empathy, including emotions recognition and providing supportive responses [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. Furthermore, commercial LLM-based applications are being developed to offer emotional support to patients [<xref ref-type="bibr" rid="ref29">29</xref>]. Given these developments, the aim of our study was to systematically review the literature on the capacity of LLMs in demonstrating empathy.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>We searched the literature on LLMs and empathy using MEDLINE, Google Scholar, PsyArXiv, medRxiv, and arXiv. Studies published between December 2022 and February 2024 were included. The search query was “((“large language models”) OR (llms) OR (gpt) OR (chatgpt)) AND ((empathy) OR (“emotional awareness”) OR (“emotional intelligence”) OR (emotion)) OR ((“social robots”) OR (“artificial emotional intelligence”) OR (“emotional artificial intelligence”) OR (“emotional chatbots”) OR (“affective computing”) OR (HRI) OR (“Human robot interaction”)).” We also searched the references lists of relevant studies, including some key studies from major medical journals, for any additional studies that may have been missed during the initial search.</p>
      <p>The inclusion and exclusion criteria are detailed in <xref ref-type="table" rid="table1">Table 1</xref>. Two reviewers (VS and EK) independently performed the search and screened the titles and abstract of the articles resulting from the search. Differences in search results were resolved through discussion to reach a consensus. The reviewers then screened selected articles’ full text for final inclusion. Ultimately, 12 publications were included in this review. The results of the included studies including the LLMs used, performance in empathy tasks, and limitations of the models, along with studies’ publication details, authors, and other relevant information were systematically summarized in a table.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Inclusion and exclusion criteria. This table outlines the inclusion and exclusion criteria applied to select studies for this review for evaluating empathy within large language models.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="150"/>
          <col width="350"/>
          <col width="500"/>
          <thead>
            <tr valign="top">
              <td>Criteria</td>
              <td>Inclusion</td>
              <td>Exclusion</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Article type</td>
              <td>Full-length original articles</td>
              <td>Nonoriginal articles including but not limited to perspectives, opinions, and reviews</td>
            </tr>
            <tr valign="top">
              <td>Language</td>
              <td>English</td>
              <td>Non-English</td>
            </tr>
            <tr valign="top">
              <td>Focus of study</td>
              <td>Articles that evaluated empathy within LLMs'<sup>a</sup> outputs</td>
              <td>Studies focusing only on emotion recognition or theory of mind, without explicit empathy evaluation</td>
            </tr>
            <tr valign="top">
              <td>Model</td>
              <td>Only LLMs<sup>a</sup></td>
              <td>Any other NLP<sup>b</sup> algorithms</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>LLM: large language model.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>NLP: natural language processing.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p><xref rid="figure1" ref-type="fig">Figure 1</xref> presents a flow diagram of the screening and inclusion process. All 12 studies included in this review were published in 2023. Six studies compared ChatGPT-3.5 with other LLMs including GPT-4, versions of LLaMA, and fine-tuned chatbots. Six studies evaluated only ChatGPT-3.5. Seven studies evaluated empathy in ChatGPT in medical context. The results of the studies included are summarized in <xref ref-type="table" rid="table2">Table 2</xref><italic>.</italic> This table provides a detailed summary of studies included in this review that evaluate aspects of empathy exhibited by large language models. The table outlines each study’s objectives, the specific large language model used key findings from the evaluations, sample sizes, and the methods used to assess empathy. It also highlights whether the reviewers were blinded to whether responses came from large language models or humans. The limitations of the LLMs as detailed in the different studies are detailed in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Flow diagram of the inclusion process based on the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines.</p>
        </caption>
        <graphic xlink:href="jmir_v26i1e52597_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Overview of studies evaluating empathy in large language models.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="90"/>
          <col width="130"/>
          <col width="100"/>
          <col width="200"/>
          <col width="130"/>
          <col width="180"/>
          <col width="170"/>
          <thead>
            <tr valign="top">
              <td>Study</td>
              <td>Objective</td>
              <td>LLM<sup>a</sup></td>
              <td>Key findings</td>
              <td>Sample size</td>
              <td>Methods for assessing empathy</td>
              <td>Reviewers were blinded to LLM versus human responses</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Webb [<xref ref-type="bibr" rid="ref23">23</xref>]</td>
              <td>Breaking bad news in emergency medicine</td>
              <td>ChatGPT-3.5</td>
              <td>ChatGPT facilitated realistic scenario design, active roleplay, and effective feedback through the application of the SPIKES<sup>b</sup> framework for breaking bad news.</td>
              <td>1 example</td>
              <td>Simulating a patient role in an emergency department setting</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Ayers et al [<xref ref-type="bibr" rid="ref26">26</xref>]</td>
              <td>Empathetic responses to patient questions</td>
              <td>ChatGPT-3.5</td>
              <td>ChatGPT responses were preferred by evaluators over physicians in 78.6% evaluations and were rated of significantly higher quality and empathy.</td>
              <td>195 questions from social media</td>
              <td>Health care professionals rated LLM and physician responses</td>
              <td>Yes</td>
            </tr>
            <tr valign="top">
              <td>Chen et al [<xref ref-type="bibr" rid="ref27">27</xref>]</td>
              <td>Simulating psychiatrists and patients in clinical psychiatric scenarios, and evaluating the expression of empathy in the interactions</td>
              <td>Chatbots based on ChatGPT</td>
              <td>ChatGPT-powered chatbots showed feasibility in simulating some aspects of empathy in psychiatric interactions, achieving a score of up to 3.43/4 when evaluated by humans for empathetic responses.</td>
              <td>14 patients and 11 psychiatrists interacting with an LLM<sup>a</sup></td>
              <td>The participants interacted with the chatbots and scored their responses for empathy</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Zhao et al [<xref ref-type="bibr" rid="ref30">30</xref>]</td>
              <td>Evaluate emotional dialogue understanding and generation and compare it with other supervised models</td>
              <td>ChatGPT-3.5</td>
              <td>Supervised models surpassed ChatGPT in emotion recognition. ChatGPT produced longer responses, but responses were also more specific to the context of the conversation compared with other models. When evaluating empathy within responses, humans preferred ChatGPT responses over EmpSOA in 54.33% of cases. When compared with MISC however, ChatGPT responses were preferred in 16% of cases.</td>
              <td>100</td>
              <td>3 readers rated the responses of different models for empathy</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Yeo et al [<xref ref-type="bibr" rid="ref31">31</xref>]</td>
              <td>Emotional support for patients with cirrhosis and those with HCC<sup>c</sup> </td>
              <td>ChatGPT-3.5</td>
              <td>ChatGPT emulated empathetic responses and offered actionable recommendations for patients and caregivers.</td>
              <td>4 prompts with 4 scenarios related to emotional support</td>
              <td>The authors’ subjective description and assessment</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Elyoseph et al [<xref ref-type="bibr" rid="ref28">28</xref>]</td>
              <td>Emotional awareness performance compared with the general population norms</td>
              <td>ChatGPT-3.5</td>
              <td>ChatGPT demonstrated significantly higher emotional awareness performance than general population norms, with improvements over time. LEAS<sup>d</sup> scores were significantly higher than those of the general population (both men’s and women’s), on all the scales.</td>
              <td>20 scenarios</td>
              <td>LEAS compared with the general population norms. Two psychologists assessed the responses</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Liu et al [<xref ref-type="bibr" rid="ref32">32</xref>]</td>
              <td>Fine-tuning an LLM to generate responses to patient questions</td>
              <td>LLM based on LLaMA-65B; ChatGPT-3.5, GPT-4</td>
              <td>GPT-4 and ChatGPT-3.5 outperformed the fine-tuned model. Both ChatGPT models and a fine-tuned LLaMA outperformed physician-generated responses.</td>
              <td>10 questions</td>
              <td>Physicians rated the responses of the chatbots and actual health care provider responses</td>
              <td>Yes</td>
            </tr>
            <tr valign="top">
              <td>Brin et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
              <td>Evaluate ChatGPT and GPT-4 on USMLE<sup>e</sup> soft-skill questions</td>
              <td>ChatGPT, GPT-4</td>
              <td>GPT-4 correctly answered 90% of questions, outperforming ChatGPT and humans.</td>
              <td>80 multiple-choice USMLE soft skills questions</td>
              <td>Correctness of responses and comparison of ChatGPT and GPT-4 performance to that of past users from the AMBOSS question bank</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Huang et al [<xref ref-type="bibr" rid="ref34">34</xref>]</td>
              <td>Evaluate emotional responses to various situations</td>
              <td> Text-davinci-003 (a variant of GPT-3), GPT-3.5-turbo, GPT-4, LLaMA-2 7B and LLaMA-2 13B</td>
              <td>The different LLMs generally demonstrate appropriate emotional responses. None of the models exhibit strong alignment with human references.</td>
              <td>400 situations</td>
              <td>Measuring the change in LLMs’ different evoked emotions (overall 8 negative emotions) in response to situations compared with human benchmark</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Chen et al [<xref ref-type="bibr" rid="ref25">25</xref>]</td>
              <td>Evaluate empathy, listening and comfort abilities of a fine-tuned LLM, compared with other LLMs</td>
              <td>SoulChat, ChatGLM-6B, ChatGPT, MeChat</td>
              <td>The fine-tuned model (SoulChat) outperformed the 3 other models in automatic metrics (ROUGE<sup>f</sup> and BLEU<sup>g</sup>), and based on human evaluation. The mean empathy score ranged between 1.84-1.90 (on a scale of 0-2), compared with 1.62-1.65 for ChatGPT.</td>
              <td>10,000 samples for automatic evaluation and 100 samples for manual evaluation</td>
              <td>Automatic evaluation tools were used, as well as manual rating by three experts in psychology</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Belkhir and Sadat [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
              <td>Evaluate whether prompt engineering and an external emotion classifier can improve ChatGPT’s empathetic responses</td>
              <td>ChatGPT</td>
              <td>Prompt engineering and the use of an external emotion classifier improved ChatGPT performance, increasing accuracy for emotion labeling from 28.64% to 39.55%.</td>
              <td>25,000 human dialogues</td>
              <td>Labeling dialogues with emotion labels</td>
              <td>No</td>
            </tr>
            <tr valign="top">
              <td>Qian et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
              <td>Evaluate the performance of LLMs in generating empathetic responses compared with other deep learning available models</td>
              <td>GPT-3, GPT-3.5, ChatGPT</td>
              <td>ChatGPT outperformed the other models in empathetic response generation, with a mean score of 4.64 (on a scale of 1-5).</td>
              <td>100 dialogues for human evaluation</td>
              <td>Automatic evaluation tools and three human raters</td>
              <td> No</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>LLMs: large language models.</p>
          </fn>
          <fn id="table2fn2">
            <p><sup>b</sup>SPIKES: Setting up, Perception, Invitation, Knowledge, Emotions with Empathy, and Strategy or Summary.</p>
          </fn>
          <fn id="table2fn3">
            <p><sup>c</sup>HCC: hepatocellular carcinoma.</p>
          </fn>
          <fn id="table2fn4">
            <p><sup>d</sup>LEAS: Levels of Emotional Awareness Scale.</p>
          </fn>
          <fn id="table2fn5">
            <p><sup>e</sup>USMLE: United States Medical Licensing Examination.</p>
          </fn>
          <fn id="table2fn6">
            <p><sup>f</sup>ROUGE: Recall-Oriented Understudy for Gisting Evaluation.</p>
          </fn>
          <fn id="table2fn7">
            <p><sup>g</sup>BLEU: Bilingual Evaluation Understudy.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>Empathy is essential in medicine, particularly when breaking bad news to patients. It allows physicians to deliver difficult information in a manner that respects the patient’s emotions and perspective. Webb [<xref ref-type="bibr" rid="ref23">23</xref>] used ChatGPT to simulate a role play for breaking bad news in the emergency department. The chatbot successfully set up a training scenario, role played as a patient and provided clear feedback through the application of the SPIKES (Setting up, Perception, Invitation, Knowledge, Emotions with Empathy, and Strategy or Summary) framework for breaking bad news [<xref ref-type="bibr" rid="ref23">23</xref>]. In another study, Yeo et al [<xref ref-type="bibr" rid="ref31">31</xref>] tested ChatGPT’s ability to provide emotional support to patients diagnosed with hepatocellular carcinoma, and their caregivers. ChatGPT was able to acknowledge the likely emotional response of the patient to their diagnosis. Furthermore, the chatbot provided clear and actionable starting points for a newly diagnosed patient and offered motivational responses encouraging proactive steps. For caregivers, ChatGPT provided psychological and practical recommendations [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
      <p>Ayers et al [<xref ref-type="bibr" rid="ref26">26</xref>] compared the quality and empathy of responses given by ChatGPT and physicians with 195 randomly drawn patient questions from a social media forum. The study found that patients preferred the chatbot’s responses over physician responses in 78.6% of cases. ChatGPT’s responses were rated significantly higher for both quality and empathy, while physician responses were 41% less empathetic than the chatbot responses. The authors noted that ChatGPT tended to provide more lengthy responses, which could potentially be erroneously associated with greater empathy. They concluded that the chatbot may have potential in aiding drafting responses to patient questions [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      <p>Another study also assessed empathy in chatbot’s responses to patient’s questions. Liu et al [<xref ref-type="bibr" rid="ref32">32</xref>] developed a model based on a pretrained LLaMA-65B and finetuned to generate physician-like responses that are professional and empathetic. They evaluated the model on 10 actual patient questions in primary care and compared the responses with those generated by ChatGPT-3.5 and GPT-4, rating them based on empathy, responsiveness, accuracy, and usefulness. When evaluating empathy, GPT-4 and ChatGPT-3.5 outperformed their model. Interestingly, all language models outperformed physician-generated responses significantly [<xref ref-type="bibr" rid="ref32">32</xref>].</p>
      <p>Understanding and addressing patients’ emotions is fundamental in mental health. Chen et al [<xref ref-type="bibr" rid="ref27">27</xref>] used ChatGPT-powered chatbots to simulate psychiatrists and patients in clinical psychiatric scenarios. The chatbots showed potential in simulating some aspects of empathy. However, they sometimes forgot initial instructions and repeated general empathy phrases too often. They also asked fewer in-depth questions about symptoms compared with physicians, potentially affecting their ability to fully understand the patient’s condition. When simulating patients, the chatbots reported symptoms inaccurately [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
      <p>The Levels of Emotional Awareness Scale (LEAS) is a psychological tool that assesses an individual’s capacity to identify and describe emotions in themselves and others, a fundamental aspect of empathy [<xref ref-type="bibr" rid="ref37">37</xref>]. Elyoseph et al [<xref ref-type="bibr" rid="ref28">28</xref>] compared the LEAS score of ChatGPT to the general population norms. They found that ChatGPT demonstrated significantly higher emotional awareness performance. When repeating the test following 1 month interval, the chatbot’s performance further improved, almost reaching the maximum possible LEAS score. The authors propose that ChatGPT could be helpful for cognitive training of people with emotional awareness impairment, as well as for psychiatric assessment support [<xref ref-type="bibr" rid="ref28">28</xref>].</p>
      <p>Zhao et al [<xref ref-type="bibr" rid="ref30">30</xref>] compared ChatGPT with supervised models in terms of emotional dialogue understanding and generation. The tasks they assessed included emotion recognition, emotion cause recognition, dialog act classification, empathetic response generation, and emotional support conversation. The authors found that while supervised models surpassed ChatGPT in emotion recognition, ChatGPT produced longer, more diverse, and context-specific responses, especially when interacting with users in negative emotional states. Interestingly, Zhao et al [<xref ref-type="bibr" rid="ref30">30</xref>] also observed a repetitive pattern in ChatGPT’s empathy expressions, similar to the results described by Chen et al [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
      <p>Brin et al [<xref ref-type="bibr" rid="ref33">33</xref>] evaluated ChatGPT and GPT-4 on USMLE (United States Medical Licensing Examination) questions involving communication skills, ethics, empathy, and professionalism. They have used questions from the USMLE website and the AMBOSS question bank and compared the performance of the LLMs with the reported performance at the AMBOSS website. GPT-4 correctly answered 90% of questions, outperforming ChatGPT and humans [<xref ref-type="bibr" rid="ref33">33</xref>]. Huang et al [<xref ref-type="bibr" rid="ref34">34</xref>] evaluated emotional responses of 5 different LLMs to various situations designed to evoke emotions, The LLMs’ responses were compared with human responses collected from 1266 participants worldwide. The authors reported for each model the changes in emotion scores relative to human benchmarks. They conclude that the different LLMs generally demonstrate appropriate emotional responses. However, none of the models exhibited strong alignment with human references. GPT-3.5-turbo demonstrated the highest alignment in the scores after imagining being in the situations. The 13B version of LLaMA-2 exhibited the strongest comprehension of human emotions.</p>
      <p>Chen et al [<xref ref-type="bibr" rid="ref25">25</xref>] constructed an empathetic conversation dataset of over 2 million samples and used it to fine-tune an LLM to provide empathetic responses. Their finetuned LLM outperformed other LLMs including ChatGPT in responses’ coherence and relevancy, as well as empathy, helpfulness and safety.</p>
      <p>Blekhir and Sadat [<xref ref-type="bibr" rid="ref35">35</xref>] evaluated whether prompt engineering and external emotion classifier can enhance empathy in ChatGPT’s responses. The study evaluated 2 versions of ChatGPT: 1 incorporating user emotions with an emotion classifier and another adapting to emotions without external tools. They evaluated these versions against the standard ChatGPT, demonstrating that tailored emotional responses significantly improve ChatGPT’s empathetic capabilities [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
      <p>Qian et al [<xref ref-type="bibr" rid="ref36">36</xref>] evaluated ChatGPT compared with other deep-learning models trained for empathetic interactions. They also propose 3 improvement methods including semantically similar in-context learning, 2-stage interactive generation, and combination with knowledge base. These methods improved the quality of responses generated by ChatGPT, which outperformed other models evaluated [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      <p>Lee et al [<xref ref-type="bibr" rid="ref38">38</xref>] used Chain-of-Empathy prompting to reason emotion and situational factors that may assist the model to infer the emotional experience. They evaluated GPT-3.5 and compared 4 unique prompts that used Chain-of-Empathy in generating empathetic responses to Reddit posts. The Chain-of-Empathy strategy resulted in improved the model’s empathy expression [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This review shows that LLMs demonstrate aspects of cognitive empathy, including recognition of emotions, and generation of emotionally supportive responses. Most studies focused on LLMs’ performance in medical contexts, assessing their ability to provide empathetic responses in clinical and nonclinical scenarios. Notable, LLMs were reported in the majority of the studies to perform comparably or even surpass human responses in certain empathy-related tasks. The review also identifies limitations, including the subjective nature of empathy evaluation, the risk of overestimating empathy due to lengthier responses, and the models’ inherent lack of emotional experience.</p>
      </sec>
      <sec>
        <title>Empathy and Social Intelligence in LLMs</title>
        <p>LLMs have shown impressive abilities in semantic understanding and logical reasoning [<xref ref-type="bibr" rid="ref5">5</xref>]. The ability of LLMs to emulate empathy, especially cognitive empathy, mirrors the growing body of research demonstrating that artificial intelligence can replicate certain aspects of social intelligence. This review supports the idea that LLMs may demonstrate some abilities that resemble social intelligence. Theory of mind involves the understanding of others’ thoughts and emotions, and predicting or explaining their behaviors based on these inferences. This concept is fundamental to social interactions, and it is a complex task, as it involves understanding not just the literal meaning of words in a conversation, but the underlying intentions, beliefs, and emotions [<xref ref-type="bibr" rid="ref39">39</xref>]. Several studies evaluated LLMs on theory of mind tasks, with varied performance, depending on the tasks and the models used [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>].</p>
      </sec>
      <sec>
        <title>Cognitive Versus Affective Perspectives</title>
        <p>The definition of empathy varies among researchers and practitioners in social sciences [<xref ref-type="bibr" rid="ref1">1</xref>]. One of the debates is whether it is a cognitive or affective concept, and most definitions of empathy include both [<xref ref-type="bibr" rid="ref1">1</xref>]. Cognitive empathy involves the ability to understand another’s feelings, closely related to theory of mind [<xref ref-type="bibr" rid="ref3">3</xref>]. Affective empathy relates to experiencing emotions in response to an emotional stimulus [<xref ref-type="bibr" rid="ref1">1</xref>]. The ability of LLMs to demonstrate empathy in various fields as highlighted in this review, seems to align more with the cognitive aspect. It is nevertheless surprising that in some cases the LLM outperformed humans in empathy-related tasks.</p>
        <p>Research suggests that cognitive and affective empathy are distinct. For instance, people with autism often struggle with cognitive empathy but have normal levels of affective empathy, while psychopathic individuals typically show the reverse pattern [<xref ref-type="bibr" rid="ref3">3</xref>]. Neurological studies demonstrated distinct brain regions associated with each type of empathy, which further supports this notion [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. It is worth questioning if demonstrating cognitive empathy alone is sufficient, or whether affective empathy is imperative for achieving human-like emotional intelligence.</p>
        <p>Historically, empathy has been viewed as a uniquely human trait, with definitions focused on interactions between humans [<xref ref-type="bibr" rid="ref1">1</xref>]. The complexity of empathy, influenced by personality, culture, and context, has led to ambiguous definitions of the term [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Empathy exhibited by AI fundamentally differs from human empathy because an algorithm does not engage in a human’s emotional experience. Consequently, human-centric definitions of empathy may not apply to LLMs. This warrants a reevaluation of how empathy is measured. The question arises whether observable responses alone can be considered empathetic if they meet human expectations or preferences. If humans cannot distinguish between responses generated by humans and LLMs, or if they prefer AI-generated responses as demonstrated in the study by Ayers et al [<xref ref-type="bibr" rid="ref26">26</xref>], perhaps emulating such empathy may be sufficient.</p>
      </sec>
      <sec>
        <title>Implications in Health Care</title>
        <p>Numerous studies support the remarkable performance of LLMs in clinical reasoning [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. These models can be applied to enhance the medical care patients receive, while decreasing the workload of health care providers [<xref ref-type="bibr" rid="ref43">43</xref>]. Yet, empathy is a key factor in patient care. Empathy in health care communication is linked to improved patient satisfaction, adherence to treatment plans, and better outcomes [<xref ref-type="bibr" rid="ref4">4</xref>]. It allows for a more nuanced understanding of patients’ emotional states and experiences, facilitating more compassionate and person-centered care. As such, the ability of LLMs to integrate empathy can significantly enhance the role of AI in health care, for both patients and health care providers.</p>
        <p>Empathy in health care aligns more with cognitive rather than affective empathy, involving the ability to understand the pain and suffering of patients, and the capability to communicate this understanding [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. Using this perspective, tools like the Jefferson Scale can assess empathy within health care settings [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]. There may be scenarios where LLMs might demonstrate more fitting empathy, especially in contexts where cognitive empathy is predominant. However, the lack of standardized methods for assessing empathy in LLMs, as also seen in this review, challenges the ability to compare their empathetic capacities across different models and tasks.</p>
        <p>Furthermore, LLMs’ empathy is influenced by cultural factors, norms, and contexts, affecting how empathy is perceived by individuals from diverse backgrounds. Awareness of interacting with an AI could bias perceptions of empathy, potentially undermining its authenticity [<xref ref-type="bibr" rid="ref47">47</xref>]. Conversely, LLMs possess the potential to overcome cultural divides, offering empathetic responses appropriate across various backgrounds.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This review has several limitations. First, as all but 1 study evaluated empathy based on subjective assessment, we could not perform a meta-analysis. Second, we only assessed studies directly discussing empathy, while there are many more that evaluate theory of mind tasks that are closely related to “cognitive” empathy. Third, all studies assessed ChatGPT-3.5, and only 1 study evaluated a model based on LLaMA and GPT-4. This can potentially limit the generalizability of findings to other LLMs. It is possible that alternative LLMs may present different empathy characteristics. Furthermore, LLMs are evolving fast, and possibly newer LLMs will present higher cognitive-like abilities.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>To conclude, this review demonstrates that LLMs exhibit elements of cognitive empathy, being able to recognize emotions and provide emotionally supportive responses in various contexts. Given that social skills are foundational to the concept of “intelligence,” further research is warranted to further develop that aspect in AI. The ability to simulate empathetic responses could enhance patient experiences, improving patient satisfaction and adherence to treatment plans. However, there remain critical questions regarding whether LLMs’ cognitive empathy is sufficient in scenarios that require deeper emotional engagement. Ultimately, as we continue to refine these models, we approach closer to bridging the gap between artificial and human-like interactions, opening opportunities for empathetic AI applications.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplemental Table 1. Limitation of Large Language Models Detailed in the Studies Included.</p>
        <media xlink:href="jmir_v26i1e52597_app1.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) checklist.</p>
        <media xlink:href="jmir_v26i1e52597_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 82 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">LEAS</term>
          <def>
            <p>Levels of Emotional Awareness Scale</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">SPIKES</term>
          <def>
            <p>Setting up, Perception, Invitation, Knowledge, Emotions with Empathy, and Strategy or Summary</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">USMLE</term>
          <def>
            <p>United States Medical Licensing Examination</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>Data extracted from the studies are available in <xref ref-type="table" rid="table1">Table 2</xref>, and upon request from authors.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cuff</surname>
              <given-names>BMP</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Howat</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>Empathy: A review of the concept</article-title>
          <source>Emotion Review</source>
          <year>2014</year>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>144</fpage>
          <lpage>153</lpage>
          <pub-id pub-id-type="doi">10.1177/1754073914558466</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hajibabaee</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>A Farahani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ameri</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Salehi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hosseini</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>The relationship between empathy and emotional intelligence among Iranian nursing students</article-title>
          <source>Int J Med Educ</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>239</fpage>
          <lpage>243</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30244237"/>
          </comment>
          <pub-id pub-id-type="doi">10.5116/ijme.5b83.e2a5</pub-id>
          <pub-id pub-id-type="medline">30244237</pub-id>
          <pub-id pub-id-type="pii">ijme.9.239243</pub-id>
          <pub-id pub-id-type="pmcid">PMC6387768</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blair</surname>
              <given-names>RJR</given-names>
            </name>
          </person-group>
          <article-title>Fine cuts of empathy and the amygdala: dissociable deficits in psychopathy and autism</article-title>
          <source>Q J Exp Psychol (Hove)</source>
          <year>2008</year>
          <volume>61</volume>
          <issue>1</issue>
          <fpage>157</fpage>
          <lpage>170</lpage>
          <pub-id pub-id-type="doi">10.1080/17470210701508855</pub-id>
          <pub-id pub-id-type="medline">18038346</pub-id>
          <pub-id pub-id-type="pii">787077598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moudatsou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stavropoulou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Philalithis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Koukouli</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The role of empathy in health and social care professionals</article-title>
          <source>Healthcare (Basel)</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>26</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare8010026"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare8010026</pub-id>
          <pub-id pub-id-type="medline">32019104</pub-id>
          <pub-id pub-id-type="pii">healthcare8010026</pub-id>
          <pub-id pub-id-type="pmcid">PMC7151200</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sallam</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT utility in healthcare education, research, and practice: systematic review on the promising perspectives and valid concerns</article-title>
          <source>Healthcare (Basel)</source>
          <year>2023</year>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>887</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare11060887"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare11060887</pub-id>
          <pub-id pub-id-type="medline">36981544</pub-id>
          <pub-id pub-id-type="pii">healthcare11060887</pub-id>
          <pub-id pub-id-type="pmcid">PMC10048148</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sklair-Levy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Zippel</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Balint Lahat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Konen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Barash</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Large language model (ChatGPT) as a support tool for breast tumor board</article-title>
          <source>NPJ Breast Cancer</source>
          <year>2023</year>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>44</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41523-023-00557-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41523-023-00557-8</pub-id>
          <pub-id pub-id-type="medline">37253791</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41523-023-00557-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC10229606</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barash</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Konen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT-4 assistance in optimizing emergency department radiology referrals and imaging selection</article-title>
          <source>J Am Coll Radiol</source>
          <year>2023</year>
          <volume>20</volume>
          <issue>10</issue>
          <fpage>998</fpage>
          <lpage>1003</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jacr.2023.06.009</pub-id>
          <pub-id pub-id-type="medline">37423350</pub-id>
          <pub-id pub-id-type="pii">S1546-1440(23)00484-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <source>Cool stuff now: epic and generative AI</source>
          <year>2023</year>
          <access-date>2024-08-13</access-date>
          <publisher-name>Epic</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.epic.com/epic/post/cool-stuff-now-epic-and-generative-ai/">https://tinyurl.com/4xvcjbh5</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <source>Microsoft and epic expand strategic collaboration with integration of azure openAI service</source>
          <year>2023</year>
          <access-date>2024-08-17</access-date>
          <publisher-name>Epic</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.epic.com/epic/post/microsoft-and-epic-expand-strategic-collaboration-with-integration-of-azure-openai-service/">https://www.epic.com/epic/post/microsoft-and-epic-expand-strategic-collaboration-with-integration-of-azure-openai-service/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Clusmann</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kolbinger</surname>
              <given-names>FR</given-names>
            </name>
            <name name-style="western">
              <surname>Muti</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Carrero</surname>
              <given-names>ZI</given-names>
            </name>
            <name name-style="western">
              <surname>Eckardt</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Laleh</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Löffler</surname>
              <given-names>CML</given-names>
            </name>
            <name name-style="western">
              <surname>Schwarzkopf</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Veldhuizen</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kather</surname>
              <given-names>JN</given-names>
            </name>
          </person-group>
          <article-title>The future landscape of large language models in medicine</article-title>
          <source>Commun Med (Lond)</source>
          <year>2023</year>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>141</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s43856-023-00370-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s43856-023-00370-1</pub-id>
          <pub-id pub-id-type="medline">37816837</pub-id>
          <pub-id pub-id-type="pii">10.1038/s43856-023-00370-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC10564921</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>JCL</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>SYH</given-names>
            </name>
            <name name-style="western">
              <surname>William</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Chew</surname>
              <given-names>LST</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Doshi-Velez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Savulescu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DSW</given-names>
            </name>
          </person-group>
          <article-title>Medical ethics of large language models in medicine</article-title>
          <source>NEJM AI</source>
          <year>2024</year>
          <volume>1</volume>
          <issue>7</issue>
          <pub-id pub-id-type="doi">10.1056/aira2400038</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehandru</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Miao</surname>
              <given-names>BY</given-names>
            </name>
            <name name-style="western">
              <surname>Almaraz</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Sushil</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Alaa</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluating large language models as agents in the clinic</article-title>
          <source>NPJ Digit Med</source>
          <year>2024</year>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>84</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-024-01083-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-024-01083-y</pub-id>
          <pub-id pub-id-type="medline">38570554</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-024-01083-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC10991271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Freyer</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Wiest</surname>
              <given-names>IC</given-names>
            </name>
            <name name-style="western">
              <surname>Kather</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A future role for health applications of large language models depends on regulators enforcing safety standards</article-title>
          <source>Lancet Digit Health</source>
          <year>2024</year>
          <volume>6</volume>
          <issue>9</issue>
          <fpage>e662</fpage>
          <lpage>e672</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-7500(24)00124-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2589-7500(24)00124-9</pub-id>
          <pub-id pub-id-type="medline">39179311</pub-id>
          <pub-id pub-id-type="pii">S2589-7500(24)00124-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Omar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Agbareia</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Apakama</surname>
              <given-names>DU</given-names>
            </name>
            <name name-style="western">
              <surname>Soroush</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sakhuja</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Horowitz</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>LD</given-names>
            </name>
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>GN</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Evaluating and addressing demographic disparities in medical large language models: a systematic review</article-title>
          <source>medRxiv</source>
          <year>2024</year>
          <fpage>2024</fpage>
          <pub-id pub-id-type="doi">10.1101/2024.09.09.24313295</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Soffer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Barash</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Konen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Adversarial attacks in radiology - A systematic review</article-title>
          <source>Eur J Radiol</source>
          <year>2023</year>
          <volume>167</volume>
          <fpage>111085</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ejrad.2023.111085</pub-id>
          <pub-id pub-id-type="medline">37699278</pub-id>
          <pub-id pub-id-type="pii">S0720-048X(23)00399-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ilicki</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A framework for critically assessing ChatGPT and other large language artificial intelligence model applications in health care</article-title>
          <source>Mayo Clinic Proceedings: Digital Health</source>
          <year>2023</year>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>185</fpage>
          <lpage>188</lpage>
          <pub-id pub-id-type="doi">10.1016/j.mcpdig.2023.03.006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nashwan</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Abujaber</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Choudry</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Embracing the future of physician-patient communication: GPT-4 in gastroenterology</article-title>
          <source>Gastroenterology &#38; Endoscopy</source>
          <year>2023</year>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>132</fpage>
          <lpage>135</lpage>
          <pub-id pub-id-type="doi">10.1016/j.gande.2023.07.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>YX</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>ZM</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>JZ</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>NZ</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>GPT-4: The future of cosmetic procedure consultation?</article-title>
          <source>Aesthet Surg J</source>
          <year>2023</year>
          <volume>43</volume>
          <issue>8</issue>
          <fpage>NP670</fpage>
          <lpage>NP672</lpage>
          <pub-id pub-id-type="doi">10.1093/asj/sjad134</pub-id>
          <pub-id pub-id-type="medline">37154801</pub-id>
          <pub-id pub-id-type="pii">7156883</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carlbring</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hadjistavropoulos</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kleiboer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Andersson</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A new era in internet interventions: the advent of Chat-GPT and AI-assisted therapist guidance</article-title>
          <source>Internet Interv</source>
          <year>2023</year>
          <volume>32</volume>
          <fpage>100621</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-7829(23)00021-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.invent.2023.100621</pub-id>
          <pub-id pub-id-type="medline">37273936</pub-id>
          <pub-id pub-id-type="pii">S2214-7829(23)00021-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC10235420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kosinski</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Theory of mind may have spontaneously emerged in large language models</article-title>
          <source>Stanford Graduate School of Business</source>
          <year>2023</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.gsb.stanford.edu/faculty-research/working-papers/theory-mind-may-have-spontaneously-emerged-large-language-models"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moghaddam</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Honey</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>Boosting theory-of-mind performance in large language models via prompting</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on April 22, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2304.11490"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sap</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>LeBras</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fried</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Neural theory-of-mind? on the limits of social intelligence in large lms</article-title>
          <source>arXiv:221013312</source>
          <year>2022</year>
          <pub-id pub-id-type="doi">10.18653/v1/2022.emnlp-main.248</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Webb</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Proof of concept: using ChatGPT to teach emergency physicians how to break bad news</article-title>
          <source>Cureus</source>
          <year>2023</year>
          <volume>15</volume>
          <issue>5</issue>
          <fpage>e38755</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37303324"/>
          </comment>
          <pub-id pub-id-type="doi">10.7759/cureus.38755</pub-id>
          <pub-id pub-id-type="medline">37303324</pub-id>
          <pub-id pub-id-type="pmcid">PMC10250131</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weizenbaum</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Empathic AI can’t get under the skin</article-title>
          <source>Nat Mach Intell</source>
          <year>2024</year>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>495</fpage>
          <pub-id pub-id-type="doi">10.1038/s42256-024-00850-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xing</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Improving llms? empathy, listening, and comfort abilities through fine-tuning with multi-turn empathy conversations</article-title>
          <year>2023</year>
          <conf-name>Findings of the Association for Computational Linguistics: EMNLP 2023</conf-name>
          <conf-date>2023 December 10</conf-date>
          <conf-loc>Singapore</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2023.findings-emnlp.83</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Poliak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Faix</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Longhurst</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Hogarth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Comparing physician and artificial intelligence chatbot responses to patient questions posted to a public social media forum</article-title>
          <source>JAMA Intern Med</source>
          <year>2023</year>
          <volume>183</volume>
          <issue>6</issue>
          <fpage>589</fpage>
          <lpage>596</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37115527"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2023.1838</pub-id>
          <pub-id pub-id-type="medline">37115527</pub-id>
          <pub-id pub-id-type="pii">2804309</pub-id>
          <pub-id pub-id-type="pmcid">PMC10148230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>KQ</given-names>
            </name>
            <name name-style="western">
              <surname>Lan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>LLM-empowered chatbots for psychiatrist and patient simulation: application and evaluation</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on May 23, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2305.13614"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elyoseph</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hadar-Shoval</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Asraf</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lvovsky</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT outperforms humans in emotional awareness evaluations</article-title>
          <source>Front Psychol</source>
          <year>2023</year>
          <volume>14</volume>
          <fpage>1199058</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37303897"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyg.2023.1199058</pub-id>
          <pub-id pub-id-type="medline">37303897</pub-id>
          <pub-id pub-id-type="pmcid">PMC10254409</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <source>LIV: pioneering AI in mental health through strategic partnerships</source>
          <year>2024</year>
          <access-date>2024-07-11</access-date>
          <publisher-name>Sheba Global</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://sheba-global.com/transforming-mental-health-care-with-ai-liv-the-next-step-in-psychiatric-innovation/">https://sheba-global.com/transforming-mental-health-care-with-ai-liv-the-next-step-in-psychiatric-innovation/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Is ChatGPT Equipped with Emotional Dialogue Capabilities?</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on April 19, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2304.09582"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yeo</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Samaan</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Trivedi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Vipani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ayoub</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Liran</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Spiegel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Assessing the performance of ChatGPT in answering questions regarding cirrhosis and hepatocellular carcinoma</article-title>
          <source>Clin Mol Hepatol</source>
          <year>2023</year>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>721</fpage>
          <lpage>732</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36946005"/>
          </comment>
          <pub-id pub-id-type="doi">10.3350/cmh.2023.0089</pub-id>
          <pub-id pub-id-type="medline">36946005</pub-id>
          <pub-id pub-id-type="pii">cmh.2023.0089</pub-id>
          <pub-id pub-id-type="pmcid">PMC10366809</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McCoy</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Carew</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Genkins</surname>
              <given-names>JZ</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Steitz</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Leveraging large language models for generating responses to patient messages</article-title>
          <source>medRxiv</source>
          <year>2023</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1101/2023.07.14.23292669"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2023.07.14.23292669</pub-id>
          <pub-id pub-id-type="medline">37503263</pub-id>
          <pub-id pub-id-type="pii">2023.07.14.23292669</pub-id>
          <pub-id pub-id-type="pmcid">PMC10370222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vaid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Soroush</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Charney</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Comparing ChatGPT and GPT-4 performance in USMLE soft skill assessments</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>16492</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-43436-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-43436-9</pub-id>
          <pub-id pub-id-type="medline">37779171</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-43436-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC10543445</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jiao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lyu</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Emotionally numb or empathetic? Evaluating how llms feel using emotionbench</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on August 07, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2308.03656"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Belkhir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sadat</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Beyond information: Is chatgpt empathetic enough?</article-title>
          <year>2023</year>
          <conf-name>Proceedings of the 14th International Conference on Recent Advances in Natural Language Processing</conf-name>
          <conf-date>2024 November 05</conf-date>
          <conf-loc>Bulgaria, Varna, Bulgaria,</conf-loc>
          <pub-id pub-id-type="doi">10.26615/978-954-452-092-2_018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>WN</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Harnessing the power of large language models for empathetic response generation: empirical investigations and improvements</article-title>
          <source>arXiv:231005140</source>
          <year>2023</year>
          <pub-id pub-id-type="doi">10.18653/v1/2023.findings-emnlp.433</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lane</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Levels of emotional awareness: theory and measurement of a socio-emotional skill</article-title>
          <source>J Intell</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>42</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jintelligence9030042"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jintelligence9030042</pub-id>
          <pub-id pub-id-type="medline">34449662</pub-id>
          <pub-id pub-id-type="pii">jintelligence9030042</pub-id>
          <pub-id pub-id-type="pmcid">PMC8395748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YK</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bae</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Chain of empathy: enhancing empathetic response of large language models based on psychotherapy models</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on November 02, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2311.04915"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bubeck</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chandrasekaran</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Eldan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gehrke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Horvitz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kamar</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YT</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nori</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Palangi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Sparks of artificial general intelligence: Early experiments with gpt-4</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on March 22, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2303.12712"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marchetti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Di Dio</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cangelosi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Manzi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Massaro</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Developing ChatGPT's theory of mind</article-title>
          <source>Front Robot AI</source>
          <year>2023</year>
          <volume>10</volume>
          <fpage>1189525</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37377631"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/frobt.2023.1189525</pub-id>
          <pub-id pub-id-type="medline">37377631</pub-id>
          <pub-id pub-id-type="pii">1189525</pub-id>
          <pub-id pub-id-type="pmcid">PMC10292745</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shamay-Tsoory</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Aharon-Peretz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Perry</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Two systems for empathy: a double dissociation between emotional and cognitive empathy in inferior frontal gyrus versus ventromedial prefrontal lesions</article-title>
          <source>Brain</source>
          <year>2009</year>
          <volume>132</volume>
          <issue>Pt 3</issue>
          <fpage>617</fpage>
          <lpage>627</lpage>
          <pub-id pub-id-type="doi">10.1093/brain/awn279</pub-id>
          <pub-id pub-id-type="medline">18971202</pub-id>
          <pub-id pub-id-type="pii">awn279</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zaki</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bolger</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ochsner</surname>
              <given-names>KN</given-names>
            </name>
          </person-group>
          <article-title>The neural bases of empathic accuracy</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2009</year>
          <volume>106</volume>
          <issue>27</issue>
          <fpage>11382</fpage>
          <lpage>11387</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/19549849"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.0902666106</pub-id>
          <pub-id pub-id-type="medline">19549849</pub-id>
          <pub-id pub-id-type="pii">0902666106</pub-id>
          <pub-id pub-id-type="pmcid">PMC2708723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sorin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Barash</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Konen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Klang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Large language models for oncological applications</article-title>
          <source>J Cancer Res Clin Oncol</source>
          <year>2023</year>
          <volume>149</volume>
          <issue>11</issue>
          <fpage>9505</fpage>
          <lpage>9508</lpage>
          <pub-id pub-id-type="doi">10.1007/s00432-023-04824-w</pub-id>
          <pub-id pub-id-type="medline">37160626</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00432-023-04824-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hojat</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Empathy in Health Professions Education and Patient Care</source>
          <year>2016</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hojat</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mangione</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nasca</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>MJM</given-names>
            </name>
            <name name-style="western">
              <surname>Gonnella</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Erdmann</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Veloski</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Magee</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The jefferson scale of physician empathy: development and preliminary psychometric data</article-title>
          <source>Educational and Psychological Measurement</source>
          <year>2001</year>
          <volume>61</volume>
          <issue>2</issue>
          <fpage>349</fpage>
          <lpage>365</lpage>
          <pub-id pub-id-type="doi">10.1177/00131640121971158</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hojat</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>DeSantis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shannon</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Mortensen</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Speicher</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Bragan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>LaNoue</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Calabrese</surname>
              <given-names>LH</given-names>
            </name>
          </person-group>
          <article-title>The jefferson scale of empathy: a nationwide study of measurement properties, underlying components, latent variable structure, and national norms in medical students</article-title>
          <source>Adv Health Sci Educ Theory Pract</source>
          <year>2018</year>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>899</fpage>
          <lpage>920</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29968006"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10459-018-9839-9</pub-id>
          <pub-id pub-id-type="medline">29968006</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10459-018-9839-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC6245107</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morris</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Kouddous</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kshirsagar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schueller</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Towards an artificially empathic conversational agent for mental health applications: system design and user perceptions</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <volume>20</volume>
          <issue>6</issue>
          <fpage>e10148</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/6/e10148/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10148</pub-id>
          <pub-id pub-id-type="medline">29945856</pub-id>
          <pub-id pub-id-type="pii">v20i6e10148</pub-id>
          <pub-id pub-id-type="pmcid">PMC6039770</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
