<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e70971</article-id>
      <article-id pub-id-type="pmid">40540733</article-id>
      <article-id pub-id-type="doi">10.2196/70971</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Using Natural Language Processing to Explore Patient Perspectives on AI Avatars in Support Materials for Patients With Breast Cancer: Survey Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Sarvestan</surname>
            <given-names> Javad</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>García-Barragán</surname>
            <given-names>Álvaro</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chrimes</surname>
            <given-names>Dillon</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wang</surname>
            <given-names>Yvette</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Liao</surname>
            <given-names>Xin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Meskó</surname>
            <given-names>Bertalan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Cheese</surname>
            <given-names>Eleanor</given-names>
          </name>
          <degrees>MSci</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-1477-9507</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Bichoo</surname>
            <given-names>Raouef Ahmed</given-names>
          </name>
          <degrees>MBBS, MS, MCh</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9386-403X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Grover</surname>
            <given-names>Kartikae</given-names>
          </name>
          <degrees>MBBS, MS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-6151-7671</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Dumitru</surname>
            <given-names>Dorin</given-names>
          </name>
          <degrees>MS, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4539-0017</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Zenonos</surname>
            <given-names>Alexandros</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4694-1642</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Groark</surname>
            <given-names>Joanne</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-7496-9695</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Gibson</surname>
            <given-names>Douglas</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-7599-3591</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Pope</surname>
            <given-names>Rebecca</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Roche Products Ltd UK</institution>
            <addr-line>Hexagon Place, 6 Falcon Way</addr-line>
            <addr-line>Shire Park</addr-line>
            <addr-line>Welwyn Garden City, AL7 1TW</addr-line>
            <country>United Kingdom</country>
            <phone>44 1707 366000</phone>
            <email>rebecca.pope@roche.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6889-589X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Roche Products Ltd UK</institution>
        <addr-line>Welwyn Garden City</addr-line>
        <country>United Kingdom</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Hull University Teaching Hospital NHS Trust</institution>
        <addr-line>Hull</addr-line>
        <country>United Kingdom</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Rebecca Pope <email>rebecca.pope@roche.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>20</day>
        <month>6</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e70971</elocation-id>
      <history>
        <date date-type="received">
          <day>8</day>
          <month>1</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>21</day>
          <month>3</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>2</day>
          <month>5</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>21</day>
          <month>5</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Eleanor Cheese, Raouef Ahmed Bichoo, Kartikae Grover, Dorin Dumitru, Alexandros Zenonos, Joanne Groark, Douglas Gibson, Rebecca Pope. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 20.06.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e70971" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Having well-informed patients is crucial to enhancing patient satisfaction, quality of life, and health outcomes, which in turn optimizes health care use. Traditional methods of delivering information, such as booklets and leaflets, are often ineffective and can overwhelm patients. Educational videos represent a promising alternative; however, their production typically requires significant time and financial resources. Video production using generative artificial intelligence (AI) technology may provide a solution to this problem.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to use natural language processing (NLP) to understand free-text patient feedback on 1 of 7 AI-generated patient educational videos created in collaboration with Roche UK and the Hull University Teaching Hospitals NHS Trust breast cancer team, titled “Breast Cancer Follow Up Programme.”</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>A survey was sent to 400 patients who had completed the breast cancer treatment pathway, and 98 (24.5%) free-text responses were received for the question “Any comments or suggestions to improve its [the video’s] contents?” We applied and evaluated different NLP machine learning techniques to draw insights from these unstructured data, namely sentiment analysis, topic modeling, summarization, and term frequency–inverse document frequency word clouds.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Sentiment analysis showed that 81% (79/98) of the responses were positive or neutral, while negative comments were predominantly related to the AI avatar. Topic modeling using BERTopic with k-means clustering was found to be the most effective model and identified 4 key topics: the breast cancer treatment pathway, video content, the digital avatar or narrator, and short responses with little or no content. The term frequency–inverse document frequency word clouds indicated positive sentiment about the treatment pathway (eg, “reassured” and “faultless”) and video content (eg, “informative” and “clear”), whereas the AI avatar was often described negatively (eg, “impersonal”). Summarization using the text-to-text transfer transformer model effectively created summaries of the responses by topic.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study demonstrates the success of NLP techniques in efficiently generating insights into patient feedback related to generative AI educational content. Combining NLP methods resulted in clear visuals and insights, enhancing the understanding of patient feedback. Analysis of free-text responses provided clinicians at Hull University Teaching Hospitals NHS Trust with deeper insights than those obtained from quantitative Likert scale responses alone. Importantly, the results validate the use of generative AI in creating patient educational videos, highlighting its potential to address the challenges of costly video production and the limitations of traditional, often overwhelming educational leaflets. Despite the positive overall feedback, negative comments focused on the technical aspects of the AI avatar, indicating areas for improvement. We advocate that patients who receive AI avatar explanations are counseled that this technology is intended to supplement, not replace, human health care interactions. Future investigations are needed to confirm the ongoing effectiveness of these educational tools.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>educational videos</kwd>
        <kwd>breast cancer</kwd>
        <kwd>natural language processing</kwd>
        <kwd>avatars</kwd>
        <kwd>patient feedback</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Efforts to ensure that patients are well informed can improve patient satisfaction, quality of life, and health outcomes, which in turn optimizes health care use [<xref ref-type="bibr" rid="ref1">1</xref>]. However, traditional passive methods of delivering information to patients through booklets and leaflets can prove ineffective and overwhelm patients [<xref ref-type="bibr" rid="ref2">2</xref>]. Moreover, printed materials are fixed in their language delivery: in English-speaking health care settings, for example, they are typically produced in English, which may exclude patients who do not speak English or have visual impairment. Similarly, a person with good conversational fluency in English may not be able to understand, discuss, or read health-related information proficiently in English [<xref ref-type="bibr" rid="ref3">3</xref>], which can worsen health inequalities and outcomes [<xref ref-type="bibr" rid="ref4">4</xref>]. In England, this issue is further exacerbated by the ongoing workforce crisis in the National Health Service (NHS) [<xref ref-type="bibr" rid="ref5">5</xref>], leaving patients with breast cancer on treatment pathways struggling to access accurate and timely information.</p>
        <p>To address these challenges, innovative solutions are necessary to streamline health care professionals’ workloads, enabling them to focus their specialist skill set on patient care. One promising approach involves the use of patient educational videos. More specifically, with the rise of generative artificial intelligence (GenAI), it is now possible to quickly create these educational videos at low cost, using digital avatars to narrate tailored scripts and incorporating language preferences that meet the specific information needs of viewers.</p>
        <p>Hull University Teaching Hospitals NHS Trust (HUTH) experienced such pressures within their breast cancer service. Specialist breast cancer nurses were spending significant amounts of time on the telephone answering common patient queries on general topics (eg, “What happens at the end of my cancer treatment?” “What are the signs of recurrence that I need to look out for?” “Who do I contact if I have concerns?”), which diverted time away from addressing highly specialized, treatment-related questions. Being aware of the benefits of educational videos in mitigating this issue and in supporting shared decision-making in consultations, HUTH explored the process of making videos manually. However, this proved to be time consuming and expensive, and it was difficult to produce videos to professional standards. Recognizing this issue, Roche UK and HUTH identified an opportunity to pilot educational videos that leveraged GenAI to create digital avatars [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>], reducing the time and financial resources required to produce educational videos.</p>
        <p>The primary aim of this pilot was to streamline the breast cancer treatment pathway and collect feedback from patients on whether they felt that these digital avatars improved their experience. Seven educational videos were developed in collaboration with clinicians and breast surgeons, ensuring that the content was precisely tailored to the informational needs of patients with breast cancer at various stages of their health journey [<xref ref-type="bibr" rid="ref8">8</xref>]. The videos’ contents covered a range of topics, including the “Breast Cancer Follow Up Programme,” which outlined a patient’s journey after their cancer treatment.</p>
        <p>To assess the success of this initiative, a survey was sent via email to 400 HUTH patients who were in remission and who had participated in watching the “Breast Cancer Follow Up Programme” retrospectively. The survey included quantitative Likert scale questions as well as free-text open-ended questions. Analyzing free-text responses offers significant advantages over relying solely on insights from Likert scale responses because free-text responses allow patients to describe their experiences in their own words, providing deeper and more specific insights and context that closed-ended questions may miss. Furthermore, free-text responses can enable the identification of emerging themes in patient perspective, such as areas of concern, suggestions for improvement, or positive aspects [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Therefore, the analysis of free-text responses is essential for understanding the nuances of patient experiences and for revealing actionable insights. However, free-text responses are often difficult to analyze in large quantities, especially in clinical settings, because clinical time is constrained, and it is often impractical for clinical staff to manually review survey feedback. Therefore, natural language processing (NLP) techniques were used to help draw insights and capture patient experiences from these data.</p>
        <p>The aim of this work was to analyze qualitative survey feedback received in free-text (unstructured) format for the video “Breast Cancer Follow Up Programme” [<xref ref-type="bibr" rid="ref8">8</xref>]. This video was selected due to the large number of patients who had experienced the breast cancer service.</p>
      </sec>
      <sec>
        <title>Prior Work</title>
        <p>Recent advancements in technology, particularly in AI and GenAI, have influenced efforts to improve patient care [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. GenAI has predominantly been applied in health care in areas such as screening and diagnosis, clinical administration support, decision support, professional medical education, and patient engagement chatbots [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. However, few studies have explored the use of GenAI to create patient educational videos or the subsequent application of traditional artificial intelligence (AI) methods, such as NLP, to understand patient preferences regarding this method of delivering patient education.</p>
        <p>Some health care providers have implemented GenAI to develop multilingual videos aimed at both health care professionals and patients [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. Notably, Adeboye et al [<xref ref-type="bibr" rid="ref19">19</xref>] explored the use of avatar-narrated videos to educate patients in postoperative wound care after breast surgery, with survey results indicating that 79% of the patients preferred this mode of content delivery over traditional leaflets. To our knowledge, our study is the first to use NLP techniques to analyze patient feedback on the use of GenAI videos.</p>
        <p>Patient centeredness is essential for high-quality care [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>], leading to a focus on integrating patient experiences and feedback into care delivery [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Patient experience surveys often include closed-ended questions for quantitative insights and open-ended questions for richer, detailed feedback [<xref ref-type="bibr" rid="ref25">25</xref>]. While closed-ended questions are easier to analyze [<xref ref-type="bibr" rid="ref26">26</xref>], open-ended responses are valued higher by health care professionals for identifying important topics and providing context to the closed-ended questions [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. Gallan et al [<xref ref-type="bibr" rid="ref28">28</xref>] noted that survey comments can sometimes contradict qualitative results, emphasizing the need to consider both to fully understand patient experiences.</p>
        <p>Qualitative patient responses, although valuable, are often underused in clinical practice due to the effort required for manual analysis [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. Data science techniques, particularly NLP, offer a solution by enabling efficient analysis of free-text responses [<xref ref-type="bibr" rid="ref30">30</xref>]; for instance, many studies use topic analysis, an NLP method that structures large text datasets into topics [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]. Common approaches include topic modeling, an unsupervised method in which algorithms identify topics; and topic classification, a supervised method in which texts are assigned to predefined topics. There are benefits and disadvantages to both approaches depending on the use case; however, in terms of topic quality, 2 studies have concluded similar results from both approaches [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <p>Cammel et al [<xref ref-type="bibr" rid="ref38">38</xref>] applied unsupervised topic modeling to free-text patient experience data from 2 hospitals. Using nonnegative matrix factorization (NMF), the authors selected a model with the highest topic coherence, assigning 87% of the responses to topics. They noted the model’s transferability to data from other hospitals due to its unsupervised nature.</p>
        <p>Additional benefits of unsupervised models over supervised classification include reduced human bias because predefined categories are unnecessary. Conversely, Doing-Harris et al [<xref ref-type="bibr" rid="ref36">36</xref>] used a supervised approach, applying vocabulary-based and naive Bayes classifiers with 28 predefined topics adapted from the taxonomy of patient satisfaction themes proposed by López et al [<xref ref-type="bibr" rid="ref39">39</xref>], with naive Bayes performing better. The authors also applied topic modeling using latent Dirichlet allocation (LDA) to negative comments, which revealed no new topics, suggesting that accurate predefined topics can eliminate the need for topic discovery with unsupervised models.</p>
        <p>Sentiment analysis is another NLP technique commonly used in the analysis of patient survey responses [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref40">40</xref>], wherein a piece of text is assigned a score or likelihood indicating its sentiment as negative, neutral, or positive. The choice of a pretrained model is crucial because its decisions depend heavily on the training data. Cammel et al [<xref ref-type="bibr" rid="ref38">38</xref>] used the <italic>pattern.nl</italic> package (trained on product reviews) to categorize their patient data but faced issues related to domain specificity; for instance, “disease” was classified as negative when, in this context, it should have been classified as neutral. By contrast, van Buchem et al [<xref ref-type="bibr" rid="ref29">29</xref>] fine-tuned a pretrained bidirectional encoder representations from transformers (BERT) model with manually labeled data, achieving up to 97% accuracy.</p>
        <p>Combining NLP techniques can provide deeper insights; for example, Cammel et al [<xref ref-type="bibr" rid="ref38">38</xref>] combined topic analysis and frequency to create a matrix that categorized topics into “topics to improve” (frequently mentioned topics with negative sentiment), “topics to celebrate” (frequently mentioned topics with positive sentiment), and “topics to monitor” (frequently mentioned topics with neutral sentiment and infrequently mentioned topics with negative sentiment). Word clouds are another way of visualizing commonly occurring words and themes within patient responses. Khanbhai et al [<xref ref-type="bibr" rid="ref9">9</xref>] combined word clouds with topic analysis to reveal ideas by health care setting (eg, outpatient vs inpatient), whereas Nawab et al [<xref ref-type="bibr" rid="ref41">41</xref>] combined word clouds with sentiment analysis to show common complaints and compliments, with separate word clouds for negative and positive comments.</p>
        <p>Summarization, a subfield of NLP, has been a subject of study for several decades but has advanced rapidly and significantly in recent years, primarily due to the development of large language models (LLMs). Within the health care domain, LLM summarization techniques have predominantly been explored in the context of electronic health records and clinical notes summarization [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]; for example, Tariq et al [<xref ref-type="bibr" rid="ref44">44</xref>] used the text-to-text transfer transformer (T5) model to generate layperson-friendly summaries of clinical radiology notes, while Van Veen et al [<xref ref-type="bibr" rid="ref45">45</xref>] evaluated various LLMs across a range of clinical text summarization tasks and found that fine-tuned language net–T5 (FLAN-T5) and GPT-4 performed best overall.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>This work built on previous efforts by testing unsupervised topic models not previously applied to patient data and combining word clouds in a novel way with sentiment and topic analysis to create sentiment-based color-coded word clouds per topic. In addition, we used LLM summarization to summarize patient experience data by topic, an innovative application in this context.</p>
        <p>The aims of this study were as follows:</p>
        <list list-type="order">
          <list-item>
            <p>To investigate the utility of AI-generated patient educational videos to deliver information on the breast cancer treatment pathway from the patient perspective</p>
          </list-item>
          <list-item>
            <p>To understand whether NLP techniques can generate automated insights into qualitative patient feedback</p>
          </list-item>
        </list>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data</title>
        <p>The raw patient data survey collated by HUTH included patient-identifiable data (eg, email addresses, age brackets, and hospital numbers), Likert scale responses, and free-text answers to the question “Any comments or suggestions to improve its [the video’s] contents?” For the purposes of this research and to adhere to the contractual data-processing and data-sharing agreement between Roche UK and HUTH, all patient-identifiable information was removed before data transfer to Roche UK.</p>
        <p>From the 400 patient surveys sent electronically, 255 (63.8%) responses were collected. Of the 255 respondents, 98 (38.4%) answered the open-ended question. NLP analysis was conducted on these free-text responses. All survey questions—closed ended as well as open ended—were optional. The 12 closed-ended questions had response rates ranging from 98.8% (252/255) to 100% (255/255), with 9 (75%) achieving a 100% (255/255) response rate.</p>
        <p>As depicted in <xref rid="figure1" ref-type="fig">Figure 1</xref>, data cleaning was applied to the raw survey responses to support NLP techniques used in this study (specifically topic analysis and the generation of word clouds using term frequency–inverse document frequency [TF-IDF]). These techniques aim to reduce the dimensionality (ie, the number of words used) of the responses, and data cleaning facilitates this process. The responses were cleaned by expanding contractions, lemmatizing each word, and removing stop words (noninformative words such as “the” and “of”) and punctuation (except for full stops, which were retained to enable sentence-level analysis). For sentiment analysis and summarization, the raw data were used because punctuation and stop words, including negation or intensifier words, can impact the sentiment of a sentence and affect the overall meaning. To allow for deeper analysis, responses were split into individual sentences (n=167) because it is possible that patients wrote about multiple topics and expressed varying sentiments within a single response. Data cleaning was achieved using the <italic>Natural Language Toolkit</italic> (<italic>NLTK</italic>) Python library [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowchart overview of the survey data analysis process, with examples of generated visualizations. AI: artificial intelligence; TF-IDF: term frequency–inverse document frequency.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e70971_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Analysis Pipeline</title>
        <p>NLP analysis methods were applied to both raw and cleaned data to generate meaningful insights from the unstructured patient feedback data, specifically topic and sentiment categorization of full responses and response sentiments, summaries by topic, and sentiment-based color-coded word clouds as illustrated in <xref rid="figure1" ref-type="fig">Figure 1</xref> and described in detail in the next subsection.</p>
      </sec>
      <sec>
        <title>NLP Methods</title>
        <p>All analyses were conducted using Python (version 3.9.12; Python Software Foundation).</p>
        <sec>
          <title>Sentiment Analysis</title>
          <p>To determine the sentiment of each of the patient responses, Valence Aware Dictionary and Sentiment Reasoner (VADER) was applied to the response sentences using the <italic>VADER</italic> Python package [<xref ref-type="bibr" rid="ref47">47</xref>]. VADER is a rule-based sentiment analysis tool that relies on sentiment dictionaries, in which each word has an associated sentiment score, to determine the overall sentiment of a text. The model is pretrained on social media comments, making it well suited for predicting the sentiment of short, informal texts containing expressed opinions, similar to the response data in this study. However, a manual inspection of the model’s predictions revealed that it did not reliably classify sentiment. As noted previously, this is likely due to words that are typically negative in general context (eg, “disease” and “cancer”) but should be classified as neutral, given the context of the survey.</p>
          <p>Therefore, a pretrained machine learning model was used instead, namely the popular HuggingFace model Twitter-roBERTa-base for Sentiment Analysis - Updated [<xref ref-type="bibr" rid="ref48">48</xref>], which was built using the Robustly Optimized BERT Pretraining Approach (RoBERTa) transformer architecture and trained on 124 million tweets. This model was chosen because the type of data it was trained on (tweets) is similar to that analyzed in this project (patient feedback): both contain opinions and emotional language, occasionally accompanied by punctuation or emojis to express sentiment. The model is able to process this emotional language, taking into account punctuation and emojis, both serving as important indicators of sentiment intensity used to convey a person’s emotional state. A manual inspection showed that the model reliably predicted the sentiment of the responses. Therefore, it was used to categorize both full responses and individual sentences as having positive, neutral, or negative sentiment, based on the highest probability score.</p>
        </sec>
        <sec>
          <title>Topic Analysis</title>
          <p>Given that the survey was based around feedback for the patient education video, the themes in our data were unlikely to reflect those commonly found in most patient satisfaction surveys, which tend to center on hospital or care experiences. Therefore, instead of classification approaches, we used unsupervised topic modeling techniques to allow for the identification of unexpected topics. Three popular unsupervised topic models—LDA, NMF, and BERTopic—were applied to the cleaned data, using the <italic>Gensim</italic> Python library [<xref ref-type="bibr" rid="ref49">49</xref>] for LDA and NMF and the <italic>BERTopic</italic> Python library for BERTopic [<xref ref-type="bibr" rid="ref50">50</xref>]. Each model was tested with a varying number of topics (ranging from 2 to 10) and evaluated manually for the meaningfulness and contextual relevance of the identified topics as well as topic coherence (<xref ref-type="table" rid="table1">Table 1</xref>). Topic coherence refers to the degree of semantic similarity among the topic descriptors [<xref ref-type="bibr" rid="ref51">51</xref>].</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Highest topic coherence scores for the unsupervised topic models applied to cleaned patient response sentences, each tested with a varying number of topics (ranging from 2 to 10).</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="600"/>
              <col width="400"/>
              <thead>
                <tr valign="top">
                  <td>Models</td>
                  <td>Topic coherence score (rounded to 4 significant figures)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>LDA<sup>a</sup></td>
                  <td>0.4844</td>
                </tr>
                <tr valign="top">
                  <td>NMF<sup>b</sup></td>
                  <td>0.4845</td>
                </tr>
                <tr valign="top">
                  <td>BERTopic (cHDBSCAN: hierarchical density-based spatial clustering of applications with noise)</td>
                  <td>0.5607</td>
                </tr>
                <tr valign="top">
                  <td>BERTopic (KeyBERT)</td>
                  <td>0.5514</td>
                </tr>
                <tr valign="top">
                  <td>BERTopic (k-means clustering with 4 clusters)</td>
                  <td>0.5467</td>
                </tr>
                <tr valign="top">
                  <td>BERTopic (KeyBERT and k-means clustering with 4 clusters)</td>
                  <td>0.5630</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>LDA: latent Dirichlet allocation.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>NMF: nonnegative matrix factorization.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>LDA and NMF are traditional algorithms widely used for topic modeling. However, these methods offer little interpretability or insight and yielded the lowest topic coherence scores. BERTopic [<xref ref-type="bibr" rid="ref49">49</xref>], a more advanced model, was also tested using various hyperparameters. On the basis of topic coherence scores and a manual inspection of the topics and constituent words, BERTopic was the most effective at identifying meaningful topics. Once the optimal number of topics (4) was identified using the elbow method (by plotting the coherence score against the number of topics), BERTopic was reapplied with a k-means clustering model, with the number of clusters set to 4. This allowed for a visual inspection of the clusters and ensured that each sentence was assigned to a topic. This method, when combined with KeyBERT (a keyword extraction technique, implemented using the <italic>KeyBERT</italic> Python package [<xref ref-type="bibr" rid="ref52">52</xref>]), achieved the highest topic coherence score (<xref ref-type="table" rid="table1">Table 1</xref>). The identified topics were visualized by reducing the dimensionality of the data using Uniform Manifold Approximation and Projection, implemented via the <italic>Uniform Manifold Approximation and Projection-learn</italic> Python library [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref54">54</xref>], and plotting the clusters on a 2D scatter plot.</p>
        </sec>
        <sec>
          <title>Word Clouds</title>
          <p>A word cloud was created for each topic identified through topic analysis to display the keywords used within the response sentences belonging to that topic. Keywords were identified using TF-IDF [<xref ref-type="bibr" rid="ref50">50</xref>], implemented with the TFidfVectorizer from the <italic>scikit-learn</italic> Python library [<xref ref-type="bibr" rid="ref55">55</xref>] using the following formula:</p>
          <graphic xlink:href="jmir_v27i1e70971_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          <p>where <italic>tf<sub>i,j</sub></italic> is the frequency of <italic>i</italic> (the word) in <italic>j</italic> (sentences belonging to the topic in question), and <italic>df<sub>i</sub></italic> is the number of documents (sentences) containing <italic>i</italic> across all sentences.</p>
          <p>Therefore, the size of each keyword in the word cloud corresponds to how frequently the word appeared in response sentences within a given topic, taking into account how often it appeared across all topics. Keywords were color coded by sentiment: red for negative, orange for neutral, and green for positive. For words appearing in multiple sentences, sentiment probabilities were summed, and the sentiment with the highest probability determined the overall sentiment context for that word. Word clouds were generated using the <italic>wordcloud</italic> Python package [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        </sec>
        <sec>
          <title>Summarization</title>
          <p>There are 2 main methods of text summarization: extractive summarization, which involves selecting important sentences from the input text; and abstractive summarization, which involves generating new, paraphrased content that captures the main ideas from the input text. In this study, abstractive techniques were used to produce condensed, coherent summaries, while also ensuring that no patient response data were revealed. LLMs are powerful and popular tools for performing abstractive summarization because they are pretrained on massive datasets, enabling them to learn complex language patterns and semantics. Popular LLMs include GPT-4 (OpenAI) and Claude (Anthropic). However, because these tools are accessible only through application programming interfaces, their use would have compromised the confidentiality of the patient data [<xref ref-type="bibr" rid="ref57">57</xref>]. Therefore, to summarize the responses from each of the 3 informative topics identified through topic analysis (excluding the topic comprising short responses with little or no content), 5 popular open-source downloadable abstractive text summarization models—Pegasus [<xref ref-type="bibr" rid="ref58">58</xref>], GPT-2 [<xref ref-type="bibr" rid="ref59">59</xref>], bidirectional and auto-regressive transformers [<xref ref-type="bibr" rid="ref60">60</xref>], T5 [<xref ref-type="bibr" rid="ref61">61</xref>], and the newer FLAN-T5 model [<xref ref-type="bibr" rid="ref62">62</xref>]—were tested locally, using the <italic>transformers</italic> Python library [<xref ref-type="bibr" rid="ref63">63</xref>]. These models were chosen due to their popularity and well-established abilities to perform zero-shot abstractive summarization at a high standard [<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref62">62</xref>]. As human-written ground truth or “gold” summaries were not available due to time constraints and lack of resources, preference-based manual evaluation was used to compare the summaries generated by the various models. Upon reviewing the summaries against the raw data, T5 was found to be the best model for summarizing the feedback because its topic summaries best covered the main ideas pertinent to each topic without revealing raw patient response data. These T5-generated summaries were then manually edited slightly for grammatical clarity.</p>
          <p>Summaries were also generated for responses separated by topic and sentiment using each of the models; however, this level of stratification resulted in few responses per group to summarize. Consequently, the outputs of the summarization models were of poor quality, often generating nonsensical results such as repeated short phrases from the responses. Therefore, only summaries generated at the topic level were used.</p>
        </sec>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This collaborative project between Roche UK and HUTH was approved by the HUTH legal team and chief medical officer. Regarding the collection of patient feedback via electronic surveys, Trust policy requires all audits to be registered with the trust governance system; however patient surveys are exempt [<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref65">65</xref>]. Therefore, ethical review and approval from the NHS research ethics committee were not required. Patients were given the choice to participate in this study and respond to the survey, and only those who consented provided responses. Response data were anonymized before being provided to Roche UK by removing patient email addresses. No compensation was provided to participants.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Sentiment Analysis</title>
        <p>Almost half of the patient responses (48/98, 49%) were positive, a little less than one-third (31/98, 32%) were neutral, and slightly less than one-fifth (19/98, 19%) were negative (<xref ref-type="table" rid="table2">Table 2</xref>). Responses were also split into constituent sentences and categorized by sentiment using the same NLP sentiment categorization method applied to the full responses. Analysis of the individual sentences revealed that the proportion of positive response sentences decreased slightly, whereas the proportion of neutral and negative response sentences increased. This indicates that some patient responses classified as overall positive likely contained a mixture of both positive and negative sentiment.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Sentiment analysis results for each patient response and each sentence in the responses.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="190"/>
            <col width="400"/>
            <col width="410"/>
            <thead>
              <tr valign="top">
                <td>Sentiment</td>
                <td>Responses (n=98), n (%)</td>
                <td>Sentences (n=167), n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Positive</td>
                <td>48 (49)</td>
                <td>72 (43.1)</td>
              </tr>
              <tr valign="top">
                <td>Neutral</td>
                <td>31 (31.6)</td>
                <td>56 (33.5)</td>
              </tr>
              <tr valign="top">
                <td>Negative</td>
                <td>19 (19.4)</td>
                <td>39 (23.4)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Sentiment Distribution by Rating</title>
        <p>To assess whether patients’ response sentiment correlated with their overall rating of the video, a grouped bar graph was plotted. <xref rid="figure2" ref-type="fig">Figure 2</xref> shows that most of the patients (42/60, 70%) who rated the video with the maximum score (5) expressed positive sentiment in their free-text responses. As the rating decreased, the proportion of positive responses decreased, while the proportion of negative responses increased. This pattern is logical because the patients’ overall satisfaction or dissatisfaction with the video would be reflected consistently throughout their survey responses. Furthermore, this helped validate that the sentiment analysis method used was accurate. A manual inspection was conducted of any unusual results, such as negative responses from patients who rated the video as excellent (score of 5), and verified that these were indeed correctly categorized because their content was overall negative. Of the 3 such responses, 1 (33%) included a comment about disliking the avatar wearing black, which can be taken as a suggestion for improvement. The other 2 negative responses were not about the video; rather, 1 (50%) was regarding the survey itself (the respondent found it confusing); and 1 (50%) described the respondent’s negative experience of feeling unsupported during their treatment, although the respondent expressed confidence that the video would help others feel supported. This highlights a limitation of analyzing the sentiment of the whole response as an indicator of respondents’ sentiment regarding the video because the response may not discuss only the topic of the video. Similarly, neutral responses with a video rating of 5 tended to be those that did not contain informative content or discuss the videos (eg, “No comments” or “None”). Analysis at the topic and sentence levels (<xref rid="figure3" ref-type="fig">Figure 3</xref> and <xref rid="figure4" ref-type="fig">Figure 4</xref>, respectively) provided deeper insight into patients’ perspectives on the videos.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Grouped bar graph showing free-text response sentiment distribution by video rating (response to the question “Your overall rating of this video [score between 1-5 with 5 = excellent and 1 = very poor]”).</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e70971_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Topic Analysis</title>
        <p>Four topics were identified by the BERTopic model (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
        <p>K-means clustering was used to assign each sentence to a topic—ensuring that no responses were excluded from the analysis—and to visually inspect the topics. As shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>, topic 0 (treatment pathway) and topic 1 (video content) are fairly overlapping topics, with some patient responses falling somewhere in between the 2 topics. Other topics are far apart, indicating minimal semantic similarity.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Topics identified by BERTopic with k-means clustering and KeyBERT.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="570"/>
            <col width="430"/>
            <thead>
              <tr valign="top">
                <td>Topic representative words</td>
                <td>Topic name</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>0: breast_treatment_care</td>
                <td>Treatment pathway<sup>a</sup></td>
              </tr>
              <tr valign="top">
                <td>1: video_videos_informative</td>
                <td>Video content<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>2: voice_impersonal_sound</td>
                <td>AI<sup>c</sup> avatar<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td>3: none_thank_add</td>
                <td>No content<sup>e</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Topic 0: these responses tended to be about the treatment pathway and how the video fit into it or the patients’ experience of how the staff or literature supported them.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Topic 1: these responses concerned the video content and the patients’ opinions on the information provided.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>AI: artificial intelligence.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>Topic 2: these responses concerned the AI presenter, its voice, and a few other technical aspects of the video, such as the subtitles or the audio.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>Topic 3: these responses were very short, such as “No comments” or “Thank you,” which did not provide any insight.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>A visualization of the topic clustering analysis of free-text response sentences. Each data point represents a patient response, color coded and labeled by the topic to which it has been assigned. Topic labels consist of the 3 most relevant words within sentences of that topic (as identified by term frequency–inverse document frequency). The distance between data points represents semantic similarity (greater distance indicates less similarity).</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e70971_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Topic Popularity</title>
        <p>To assess the popularity of each topic in patients’ feedback, the number of patients who mentioned each topic in their responses was calculated. As shown in <xref ref-type="table" rid="table4">Table 4</xref>, the treatment pathway topic was the most popular, with half of the patients (49/98, 50%) who gave free-text feedback mentioning this topic. The next most popular topic was video content, with a little less than half of the patients (43/98, 44%) mentioning this topic. Only 17% (17/98) of the patients mentioned the AI avatar.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Number of patients whose response sentences were assigned to each of the 4 identified topics (n=98; a patient could mention &gt;1 topic and the same topic in multiple sentences).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="390"/>
            <col width="610"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Patients mentioning topic, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Treatment pathway</td>
                <td>49 (50)</td>
              </tr>
              <tr valign="top">
                <td>Video content</td>
                <td>43 (44)</td>
              </tr>
              <tr valign="top">
                <td>AI avatar</td>
                <td>17 (17)</td>
              </tr>
              <tr valign="top">
                <td>No content</td>
                <td>12 (12)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Sentiment Distribution by Topic</title>
        <p>To assess whether patients spoke about each topic positively or negatively, a grouped bar chart was created to show the sentiment of each response sentence and the topic with which it was associated. As shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>, sentiment for the treatment pathway topic was mostly positive or neutral, and sentiment for the video content topic was mostly positive, whereas sentiment for the AI avatar topic was predominantly negative. This likely reflects that most patients (10/17, 59%) who mentioned the AI presenter described it as “impersonal,” which was the second most relevant word in sentences assigned to this topic.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Grouped bar graph showing free-text response sentiment distribution of sentences assigned to each topic. AI: artificial intelligence.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e70971_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Word Clouds</title>
        <p>To better understand the patients’ feedback about each aspect of the video and their associated feelings, word clouds were created to represent key words from the responses for each topic (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <p>As shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, for the treatment pathway topic, it can be interpreted that patients found that they were reassured and felt calm, the treatment pathway was faultless, and many of them were thankful.</p>
        <p>For the video content topic, positive words can be seen that likely describe how patients felt about the content, such as “informative,” “relevant,” “clear,” and “comprehensive.”</p>
        <p>Finally, for the AI avatar topic, it can be interpreted that patients who mentioned the avatar felt that it was “impersonal” and felt “disconnected” from the topic of breast cancer treatment, or they found it “distract[ing].”</p>
      </sec>
      <sec>
        <title>Summarization</title>
        <p>To identify the main takeaways from the patients’ feedback, the T5 abstractive summarization model was used to summarize response sentences from each topic (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). The generated summaries were then manually edited and checked against the raw data for grammatical clarity and to confirm that they accurately represented the data. The summaries aligned with findings from the earlier analyses.</p>
        <boxed-text id="box1" position="float">
          <title>Manually edited artificial intelligence (AI)–generated summaries of patient feedback by the text-to-text transfer transformer model by topic.</title>
          <p>
            <bold>Treatment pathway</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Many patients were pleased with the treatment process and felt that they were well informed throughout. The video was helpful, reassuring, and well explained. A few patients commented that they wished that they had this video at the start of the treatment.</p>
            </list-item>
          </list>
          <p>
            <bold>Video content</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Most respondents were positive about the video content and found it to be informative, clear, concise, and easy to understand and felt that it covered the essential points of the follow-up program.</p>
            </list-item>
          </list>
          <p>
            <bold>AI avatar</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>Most respondents who mentioned the AI-generated presenter felt that the use of the presenter made the video feel impersonal and would have preferred a human presenter. A few respondents also found the AI presenter distracting, and a few mentioned that the voice was not in sync with the presenter’s lip movements.</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study evidences that patient health care education material delivered using GenAI (via an avatar) is generally received positively by patients. Moreover, algorithmic approaches such as NLP can be effectively applied to qualitative feedback to identify areas for improvement in delivering health information using this technology. This point is especially pertinent, given the current workforce constraints within an evolving NHS [<xref ref-type="bibr" rid="ref66">66</xref>], which make it infeasible to manually analyze even a small corpus (n=98) of patient feedback.</p>
        <p>In addition, this work reinforces earlier findings that large volumes of patient comments can be efficiently processed using NLP methodologies to draw meaningful and actionable insights [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref67">67</xref>]. This adds to the body of evidence demonstrating that various NLP techniques, such as topic modeling and sentiment analysis, and visualization of their results provide a more profound understanding of patient feedback, in this case revealing both successful aspects of the video and areas needing improvement. New visualization techniques were explored, such as sentiment-based color-coded word clouds by topic, which provided clearer insights into the data. In addition, as the NHS elective care recovery delivery plan [<xref ref-type="bibr" rid="ref68">68</xref>] commits to providing better information and support to patients with the introduction of new and innovative ways of delivering health care, it is more important than ever that patients feel confident that their feedback is sought and integrated into new models of care. Consistent with the NHS plan’s objectives, this study demonstrated how summarization models can facilitate an overview of the patient data, significantly reducing the time required to review individual comments.</p>
        <p>Overall, the analysis revealed predominantly positive responses. Four key topics were identified, with positive feedback on the treatment pathway and video content and negative feedback concerning the digital avatar. Many patients expressed satisfaction with their experience of the breast cancer treatment pathway, noting that the videos were informative and could be a valuable and reassuring resource for patients at the beginning of the treatment pathway. Concerns regarding the avatar included its robotic or impersonal voice and the audio being out of sync with the avatar’s lip movements. However, as this technology is ever improving and producing more human-like avatars, these concerns are likely to be resolved with further model development. Other patients did not like the use of AI to create these videos at all, which could be reflective of the general mistrust of AI in health care [<xref ref-type="bibr" rid="ref69">69</xref>].</p>
        <p>This underscores an important ethical consideration in the use of such technology for health care education. While our study demonstrates the value of using AI to quickly and effectively create valuable breast cancer educational videos, this technology may not be appropriate for all types of health care–related content. Specifically, AI-generated videos may not be suitable for discussing particularly sensitive or emotional topics. Furthermore, adherence to responsible AI regulation and guidelines, as well as transparent communication with patients about the role of AI in creating educational materials, is crucial to maintaining patient trust [<xref ref-type="bibr" rid="ref70">70</xref>]. This is especially true considering the rise in misuse of GenAI technology to create videos to deceive people or spread misinformation [<xref ref-type="bibr" rid="ref71">71</xref>-<xref ref-type="bibr" rid="ref75">75</xref>]. Thus, it will be an important consideration when creating and distributing AI-generated educational videos to find ways to distinguish them as credible and reliable sources of information.</p>
        <p>These results echo those of similar studies indicating that closed-ended questions do not disclose the full picture of patient feedback and that open-ended responses are crucial for understanding the nuances of patient opinions. Consistent with the findings of Gallan et al [<xref ref-type="bibr" rid="ref28">28</xref>] in a similar study, this is further supported by the differences in sentiment between the patients’ overall video scores and their free-text responses. As shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>, some patients assigned a perfect score yet left a negative or neutral comment. Although some of these negative or neutral comments were unrelated to the video itself, a negative comment regarding the respondent’s dislike of the avatar wearing black provides an actionable insight for improving these videos.</p>
        <p>Our findings add to a wider discussion on the optimal methods for delivering health care information and promoting health literacy. Specifically, a large body of work has demonstrated that written health information is often difficult for most intended audiences to comprehend [<xref ref-type="bibr" rid="ref76">76</xref>]. A systematic review of readability assessment studies reported that most of the COVID-19 vaccine information supplied by health care providers exceeded the recommended grade reading level, which the authors hypothesize contributed to vaccine hesitancy during the pandemic [<xref ref-type="bibr" rid="ref77">77</xref>]. Another systematic review reported that web-based patient information for common sports injuries was written above the recommended reading level [<xref ref-type="bibr" rid="ref78">78</xref>]. More recently, a systematic review of written information for patients spanning 30 years highlighted that the reading level of patient information across all clinical areas was too high for patients and encouraged new modes of communication to educate patients [<xref ref-type="bibr" rid="ref79">79</xref>]. Given that almost half of the patients (48/98, 49%) in this study expressed positive sentiment toward health care information delivered using GenAI (in the form of an avatar), the reported high readability barriers may be considerably lowered by adopting this technological approach. Moreover, GenAI avatars can now automatically deliver content in &gt;140 languages with 1-click translations [<xref ref-type="bibr" rid="ref80">80</xref>], potentially further addressing language barriers in health care education [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Beyond providing effective patient education, these videos aim to help reduce the time that specialist breast cancer care nurses spend answering common patient queries, allowing them to focus on patient care and on answering more highly specialized, treatment-related questions. While data were not collected on the impact of these AI-generated videos on reducing health care professional workloads in this study, patient educational videos have been shown to reduce the number of patients requiring direct contact with health care providers [<xref ref-type="bibr" rid="ref81">81</xref>]. Furthermore, previous studies have found that patients prefer this form of media over traditional leaflets and that educational videos improve shared decision-making in clinical practice while increasing health literacy and medication adherence [<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref83">83</xref>]. However, further work is needed to confirm such beneficial impacts in our case, such as a comparison of the number of calls made by patients to breast cancer nurses before and after the introduction of these videos.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The primary limitations of this study were the small sample size (98 responses) and patient acuity. Although splitting the data into sentences increased the dataset size and provided deeper insights, future projects would benefit from a larger sample for more accurate NLP model evaluation and pattern investigation. More data would enable the labeling and testing of the topic and sentiment models, which would provide more robust and objective accuracy metrics. Furthermore, semantic analysis could improve by incorporating higher n-grams and refining contextual polarity [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref84">84</xref>]. Finally, larger sample sizes would likely allow for more effective summarization by topic and sentiment, potentially revealing deeper insights into patient responses.</p>
        <p>If additional data cannot be collected, synthetic data generation [<xref ref-type="bibr" rid="ref85">85</xref>] and augmentation techniques such as word replacement or shuffling could be used to enhance the dataset [<xref ref-type="bibr" rid="ref86">86</xref>]; for example, Li et al [<xref ref-type="bibr" rid="ref87">87</xref>] used the synthetic minority oversampling technique (SMOTE) algorithm to balance their dataset of patient complaints to ensure equal representation across topic categories.</p>
        <p>Alternatively, improving the response rate for the open-ended question—38.4% (98/255) in this study—would help increase the sample size. This might be achieved by making the question mandatory, reordering the survey questions, or offering incentives to respondents who complete the full survey [<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref89">89</xref>]. In this study, all survey questions were optional; however, in contrast to the low response rate for the open-ended questions, the closed-ended questions had a minimum response rate of 98.8% (252/255), with 9 (75%) of the 12 questions being answered by all respondents. This is expected because closed-ended questions are easier and faster to answer; however, future studies should explore ways to increase the response rate for open-ended questions to levels similar to those for closed-ended questions for a more diverse set of responses.</p>
        <p>It is worth noting that there are limitations to our sentiment analysis methods. First, although the pretrained sentiment analysis model we used is known to generally perform at a high degree of reliability, not all sentiment categorizations made by the model will be completely accurate. Precise accuracy metrics specific to our model are unavailable. However, previous research studies indicate that similar models, based on the RoBERTa architecture, demonstrate accuracies ranging from 90% to 96% [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref90">90</xref>].</p>
        <p>Second, it is important to understand that the color of each keyword in the word cloud is associated with the sentence in which the word appears, rather than the sentiment associated with the word itself. This is because we are using sentences as a way to segment the responses into constituent topics. Although this technique helps us better understand the details of patient responses, this is not always the case in reality; for example, a sentence could contain positive sentiment about one topic and negative sentiment about another. An improvement to this method would be to segment the responses by constituent topics, rather than relying on sentence boundaries, as in aspect-based sentiment analysis [<xref ref-type="bibr" rid="ref91">91</xref>]; however, implementing this technique poses challenges and requires the adoption of more complicated models.</p>
        <p>Only relevant data were collected to answer the primary research question in accordance with the UK government’s Caldicott Principles [<xref ref-type="bibr" rid="ref92">92</xref>]. This was a necessary step in data governance and ethics approval; however, it limits the generalizability of our findings to diverse populations [<xref ref-type="bibr" rid="ref93">93</xref>] because we did not have access to any demographic data. Factors including patient age, digital literacy, opinion on technology, patient acuity (eg, patient activation scores [<xref ref-type="bibr" rid="ref94">94</xref>]), and patient confidence in managing their disease may all influence survey results [<xref ref-type="bibr" rid="ref95">95</xref>]. Further analysis of the impact of these factors on the patient perspective on the use of these videos as patient education tools would help reveal whether the findings of this study represent those of broader and more diverse patient groups.</p>
        <p>The patients with breast cancer included in this study were in remission; therefore, it is unknown whether patients with breast cancer who are undergoing active treatment regimens would have similar perspectives. This is an important consideration because the information in the 7 videos created using GenAI technology by this collaborative work is aimed at patients at different points in the treatment pathway and on different treatment regimens (eg, “Breast Pain after Surgery” for patients who have undergone mastectomy or “Endocrine Therapy” for patients receiving hormonal treatment). Furthermore, cancer stage may influence patients’ views of these videos because individuals at different stages may face varying health and social care challenges (eg, loss of a job or reduced working hours and childcare responsibilities).</p>
        <p>Digital inclusivity is another important factor to consider because 96% of breast cancers are diagnosed in women aged &gt;40 years [<xref ref-type="bibr" rid="ref96">96</xref>], as a function of lower digital literacy and internet use [<xref ref-type="bibr" rid="ref97">97</xref>,<xref ref-type="bibr" rid="ref98">98</xref>]. Thus, it is crucial that the information in these videos is delivered in an accessible way to ensure that there is no disparity in the level of service provided to a hospital’s diverse patient population. Therefore, further investigation is warranted with a broader sample of patients with breast cancer to explore diverse prospective patient feedback throughout cancer treatments.</p>
        <p>Finally, the survey response rate was 63.8% (255/400), with only 38.4% (98/255) of the respondents providing open-ended feedback. This low sample size for the open-ended free-text question may not capture the full spectrum of patient feedback. Moreover, there may exist a bias in the subset of patients with breast cancer who answered the free-text question and among those who completed the survey compared to the broader population of patients with breast cancer who completed the survey and those who were sent the survey, respectively (ie, nonresponse bias); for example, individuals with strong positive or negative opinions may be more likely to volunteer open-ended feedback, skewing the data [<xref ref-type="bibr" rid="ref27">27</xref>]. This may have contributed to the predominance of negative comments concerning the digital avatar: it is possible that those who did not have strong opinions on the avatar did not provide free-text feedback; however, further research is required to confirm this.</p>
        <p>Alternatively, factors such as digital literacy or age, as discussed previously, may have influenced a patient’s likelihood of providing feedback (at all or specifically open-ended) [<xref ref-type="bibr" rid="ref88">88</xref>,<xref ref-type="bibr" rid="ref99">99</xref>]. However, due to ethical and data privacy constraints, we cannot disclose any information about the patients who did not complete the study. This lack of comparative demographic data restricts our ability to understand and reveal any potential biases in the collected responses.</p>
      </sec>
      <sec>
        <title>Comparison to Prior Work</title>
        <p>Unlike studies that analyzed unsolicited patient comments from social media or hospital feedback sites, this project used solicited survey data. Greaves et al [<xref ref-type="bibr" rid="ref40">40</xref>] note that unsolicited comments often exhibit selection bias toward more extreme positive or negative experiences, resulting in unrepresentative, polarized results. By collecting feedback through surveys, this study minimized such bias, as evidenced by the high level of neutral feedback shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <p>Splitting responses into sentences enhanced granularity, improving the understanding of topics and sentiments, as shown by the differences in the proportions of negative, neutral, and positive sentences compared to full responses (<xref ref-type="table" rid="table2">Table 2</xref>). Nawab et al [<xref ref-type="bibr" rid="ref41">41</xref>] also used sentence-level analysis but only when sentiments differed between sentences, which may have led to the omission of some topics. This approach also increased the dataset size from 98 to 167, benefiting NLP techniques that require larger datasets (namely, topic modeling, summarization, and TF-IDF word clouds). However, splitting by sentence can fail to capture all topics and sentiments accurately because sentences can contain both positive and negative sentiments. Consequently, the topic-based sentiment analysis may not be accurately representative in all cases, and word cloud colors may reflect sentence sentiment rather than the word’s overall sentiment. Splitting responses by constituent topics (multilabeling) could improve accuracy, but this approach is complex and may not suit short texts, such as those in this study (mean length 15 words, SD 10) [<xref ref-type="bibr" rid="ref100">100</xref>,<xref ref-type="bibr" rid="ref101">101</xref>].</p>
        <p>The sentiment analysis results support prior research indicating that this technique can accurately assess patient survey responses [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref67">67</xref>]. However, due to the small sample size (n=167 sentences) and the absence of labeled data, a quantitative evaluation of model accuracy was not performed; instead, visual inspection was used to identify the most suitable model.</p>
        <p>Similar to previous studies, simpler models such as VADER struggled with health-related comments [<xref ref-type="bibr" rid="ref102">102</xref>]. As mentioned previously, this is likely because the negative scores of words such as “cancer” have a big impact on the overall sentence scores, given that VADER relies on a sentiment dictionary rather than taking into account the full context of the sentence. By contrast, BERT-based models, which have not been extensively explored for patient experience data, showed promise. This study is the first to apply the HuggingFace RoBERTa model [<xref ref-type="bibr" rid="ref48">48</xref>] to patient data, although BERT-based models have been used previously; for instance, Osváth et al [<xref ref-type="bibr" rid="ref103">103</xref>] reported 72% accuracy using fine-tuned huBERT on a Hungarian Twitter (subsequently rebranded as X) dataset, while Chatzimina et al [<xref ref-type="bibr" rid="ref104">104</xref>] achieved accuracies of 95% and 91% with BERT and RoBERTa, respectively, fine-tuned on Greek patient-clinician conversations. In addition, RoBERTa-based models (trained on Wikipedia and news articles) fine-tuned on nonpatient data have demonstrated accuracies ranging between 90% and 96% [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref90">90</xref>].</p>
        <p>In line with previous studies [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref105">105</xref>], unsupervised topic modeling effectively identified unknown topics in responses. BERTopic with KeyBERT for keyword extraction and k-means clustering emerged as the best model. This was assessed through both topic coherence (a quantitative metric) and a subjective evaluation of topic relevance. Most studies rely solely on topic coherence to evaluate models [<xref ref-type="bibr" rid="ref106">106</xref>], but in support of the evaluation methods used in this work, previous studies [<xref ref-type="bibr" rid="ref107">107</xref>-<xref ref-type="bibr" rid="ref109">109</xref>] argue for taking topic usefulness into account, with the addition of incorporating human-interpretability metrics such as word intrusion and topic intrusion. These techniques involve human assessors identifying “intruder” words or topics, helping to mitigate bias and better gauge the model’s usefulness. Future studies should include these methods with multiple assessors for a more comprehensive evaluation.</p>
        <p>Consistent with the findings of Egger and Yu [<xref ref-type="bibr" rid="ref110">110</xref>], BERTopic performed better with shorter, emotional texts than LDA and NMF. This is attributed to BERT embeddings, which capture contextual information and can effectively process diverse text elements such as emojis and punctuation. By contrast, LDA and NMF rely on a bag-of-words approach, which ignores word order and context, making them more sensitive to noise and nonstandard text elements. Furthermore, Steele et al [<xref ref-type="bibr" rid="ref111">111</xref>] similarly found success in applying BERTopic to identify care experience topics in a much larger dataset of approximately 47,000 free-text responses from patient experience surveys. The findings support the use of this method for revealing topics in unstructured patient survey response data in future, larger studies.</p>
        <p>In this study, k-means clustering was used to assign every sentence to a topic, ensuring no data loss and the inclusion of all patient responses in the analysis. However, this method may have compromised topic quality by oversimplifying data and adding noise, as indicated by the lower topic coherence score when switching from hierarchical density-based spatial clustering of applications with noise (HDBSCAN) to k-means clustering (<xref ref-type="table" rid="table1">Table 1</xref>). Nevertheless, combining k-means clustering with KeyBERT achieved the highest topic coherence.</p>
        <p>An interesting finding from the study was the negative color-coded occurrence of the term “GP” in the treatment pathway word cloud (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). This is particularly noteworthy, considering this study’s cohort: patients who had been through the treatment pathway and, therefore, should have had no contact with primary care providers such as general practitioners (GPs). Initially, it was thought that the negative color coding of this term might reflect the recent decline in patient satisfaction with GP access [<xref ref-type="bibr" rid="ref112">112</xref>,<xref ref-type="bibr" rid="ref113">113</xref>]. However, further investigation revealed that the contexts in which “GP” appeared were neutral (despite the sentences concerned being correctly classified as negative overall). Specifically, patients referred to GPs because, prior to watching the educational video, they were unaware that they should recontact their secondary care provider (breast cancer nurses) with any queries, rather than their GPs. This observation ties into broader issues surrounding cancer treatment pathways within the NHS.</p>
        <p>The COVID-19 pandemic has exacerbated backlogs in cancer care [<xref ref-type="bibr" rid="ref114">114</xref>,<xref ref-type="bibr" rid="ref115">115</xref>]. For patients with a history of cancer, clear guidance on whom to contact in the event of a suspected recurrence is critical because such clarity is linked to improved health outcomes [<xref ref-type="bibr" rid="ref116">116</xref>]. As highlighted by Breast Cancer Now, the lack of clarity can result in patients seeking help from GPs [<xref ref-type="bibr" rid="ref116">116</xref>], and this pattern is reflected in the findings of this study. These results underscore the importance of these educational videos in supporting patients to contact the right service at the right time.</p>
        <p>Abstractive summarization models were evaluated based on the quality and readability of their outputs. Recall-Oriented Understudy for Gisting Evaluation (ROUGE) <italic>F</italic>-measure scores [<xref ref-type="bibr" rid="ref117">117</xref>] are a standard metric for evaluating summarization performance. They measure the n-gram lexical overlap between the generated summary and the reference human-written “gold” summary [<xref ref-type="bibr" rid="ref118">118</xref>]. Although a gold summary did not exist to use as a benchmark in this project, an improvement in future similar studies would be to identify a validation dataset to quantitatively assess different summarization models using this metric, such as a previous patient survey and a human-written summary of the results.</p>
        <p>Through manual inspection, the T5 model performed best in summarizing patient feedback responses; the summaries generated by Pegasus, FLAN-T5, bidirectional and auto-regressive transformers, and GPT-2 were not as clear or comprehensive. This supports the findings of Nguyen et al [<xref ref-type="bibr" rid="ref119">119</xref>], who reported in their comparative evaluation of many popular summarization models that T5-generated summaries were the most readable and that Pegasus performed relatively poorly. Similarly, Tariq et al [<xref ref-type="bibr" rid="ref44">44</xref>] found success using the T5 model to summarize health-related texts. In this study, GPT-2 did not generate comprehensive summaries. However, Fu et al [<xref ref-type="bibr" rid="ref120">120</xref>] report that GPT-2 performs better when given ≥1 examples (few-shot learning) and that GPT-3 performs even better; therefore, these avenues should be explored in future related work. Interestingly, FLAN-T5—the instruction-tuned successor to T5—performed worse than the original T5 model in this study. This contrasts with the findings of Pal et al [<xref ref-type="bibr" rid="ref121">121</xref>], who reported superior ROUGE scores for FLAN-T5 in generating hospital discharge summaries. However, this is likely due to the differences in evaluation methods: Pal et al [<xref ref-type="bibr" rid="ref121">121</xref>] used ROUGE scores to benchmark generated summaries against “ground truth” discharge summaries, whereas this study relied on human-based preference evaluation due to the absence of reference “gold” summaries.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This work demonstrates the utility of GenAI videos for delivering patient information and the success of NLP techniques in accurately and efficiently generating insights into patient feedback. Sentiment analysis showed that 81% (79/98) of the patient responses were positive or neutral, with negative comments mostly related to the AI avatar. Using the BERTopic model, we identified 4 topics: the breast cancer treatment pathway, video content, the digital avatar, and short responses with little or no content. The T5 model was used to generate abstractive summaries of the responses by topic. Combining the results from these NLP techniques facilitated the creation of clear visuals and insights, including the novel combination of topic and sentiment analysis with TF-IDF to produce sentiment-based color-coded word clouds by topic. These deeper analyses revealed valuable insights into the patients’ perspectives on the video, with many commenting that they found the video informative and reassuring and that they believed that it would be a valuable resource for individuals beginning the breast cancer treatment pathway. The positive results from this work validate the use of GenAI in creating patient educational videos. Negative patient feedback mostly concerned technical issues related to the avatar that are likely to be resolved with further model development; however, similar future investigations into patient opinions will be needed to confirm this.</p>
        <p>To assess how well such GenAI videos meet the varied needs and preferences of the wider patient population, future studies should aim to recruit a larger and more diverse sample of patients with breast cancer, spanning different ages, digital literacy levels, geographies, stages of treatment, treatment regimens, and levels of patient acuity. In combination with an improvement in the free-text question response rate, this would also help to mitigate any potential impact of bias on the collected responses. Given patient consent and compliance with data privacy regulations, collecting demographic data such as age and literacy levels alongside response data would also allow for the investigation of potential biases in patient feedback, thereby improving the usability of study findings. A larger dataset would also enable more robust evaluations of NLP models, especially when combined with expert annotations of sentiment and topics as well as ground truth summaries.</p>
        <p>Overall, this study provides insight into the potential of GenAI to create patient educational videos, while identifying patient concerns that can be addressed in future AI-generated digital materials. The NLP methods applied here can be used in future, larger studies to automate efficient analysis and insight generation from unstructured patient response data.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Word clouds representing keywords extracted from patient responses for each topic. Keywords are color coded according to the sentiment of the sentences in which they appeared. For words appearing in many sentences, sentiment scores were aggregated, and the sentiment with the highest probability determined the overall sentiment context for that word. Colors indicate sentiment as follows: red for negative, orange for neutral, and green for positive.</p>
        <media xlink:href="jmir_v27i1e70971_app1.png" xlink:title="PNG File , 490 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BERT</term>
          <def>
            <p>bidirectional encoder representations from transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">FLAN</term>
          <def>
            <p>fine-tuned language net</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">GenAI</term>
          <def>
            <p>generative artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">GP</term>
          <def>
            <p>general practitioner</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">HDBSCAN</term>
          <def>
            <p>hierarchical density-based spatial clustering of applications with noise</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">HUTH</term>
          <def>
            <p>Hull University Teaching Hospitals NHS Trust</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NHS</term>
          <def>
            <p>National Health Service</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">NMF</term>
          <def>
            <p>nonnegative matrix factorization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">RoBERTa</term>
          <def>
            <p>Robustly Optimized BERT Pretraining Approach</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">ROUGE</term>
          <def>
            <p>Recall-Oriented Understudy for Gisting Evaluation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">T5</term>
          <def>
            <p>text-to-text transfer transformer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">TF-IDF</term>
          <def>
            <p>term frequency–inverse document frequency</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">VADER</term>
          <def>
            <p>Valence Aware Dictionary and Sentiment Reasoner</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>Roche Products Ltd provided resources equivalent to GBP £25,000 (US $33,807.88) for this project. This work was facilitated through a joint working agreement between Roche Products Ltd and Hull University Teaching Hospitals NHS Trust (M-GB-00018961; August 2024). Financial and in-kind contributions are publicly disclosed annually on the Association of the British Pharmaceutical Industry Disclosure UK platform in line with the requirements of the association’s code of practice.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets generated or analyzed during this study are not publicly available due to patient data protection regulations but are available from the corresponding author on reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>EC contributed to writing the original draft and reviewing and editing the manuscript. RAB contributed to reviewing and editing the manuscript. KG and DD contributed to conceptualization, resources, project administration, supervision, and reviewing and editing the manuscript. AZ contributed to supervision and reviewing and editing the manuscript. JG and DG contributed to resources, project administration, and supervision. RP contributed to resources, project administration, supervision, and reviewing and editing the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aslani</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Patient empowerment and informed decision-making</article-title>
          <source>Int J Pharm Pract</source>
          <year>2013</year>
          <month>12</month>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>347</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1111/ijpp.12076</pub-id>
          <pub-id pub-id-type="medline">24188495</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Veneri</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Zdanis</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Are technology-informed methods better than traditional approaches in educating patients? A meta-analysis</article-title>
          <source>Health Educ J</source>
          <year>2018</year>
          <month>01</month>
          <day>09</day>
          <volume>77</volume>
          <issue>3</issue>
          <fpage>261</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1177/0017896917741511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Language interpreting and translation: migrant health guide</article-title>
          <source>Office for Health Improvement and Disparities, United Kingdom Government</source>
          <year>2017</year>
          <month>6</month>
          <day>23</day>
          <access-date>2025-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.gov.uk/guidance/language-interpretation-migrant-health-guide">https://www.gov.uk/guidance/language-interpretation-migrant-health-guide</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al Shamsi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Almutairi</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Al Mashrafi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Al Kalbani</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Implications of language barriers for healthcare: a systematic review</article-title>
          <source>Oman Med J</source>
          <year>2020</year>
          <month>03</month>
          <day>30</day>
          <volume>35</volume>
          <issue>2</issue>
          <fpage>e122</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32411417"/>
          </comment>
          <pub-id pub-id-type="doi">10.5001/omj.2020.40</pub-id>
          <pub-id pub-id-type="medline">32411417</pub-id>
          <pub-id pub-id-type="pii">OMJ-35-02-1900033</pub-id>
          <pub-id pub-id-type="pmcid">PMC7201401</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <article-title>Cancer services: twelfth report of session 2021–22</article-title>
          <source>House of Commons</source>
          <year>2022</year>
          <access-date>2025-06-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://committees.parliament.uk/publications/9562/documents/161967/default/">https://committees.parliament.uk/publications/9562/documents/161967/default/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <article-title>Collaborative working executive summary: project title: evaluating the impact of digital patient support materials on the breast cancer pathway</article-title>
          <source>Roche</source>
          <access-date>2022-10-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://assets.roche.com/f/172650/x/852ee21bfd/m-gb-00009460.pdf">https://assets.roche.com/f/172650/x/852ee21bfd/m-gb-00009460.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Synthesia homepage</article-title>
          <source>Synthesia</source>
          <access-date>2024-11-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.synthesia.io/">https://www.synthesia.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>Symptomatic breast service patient videos</article-title>
          <source>Hull University Teaching Hospitals NHS Trust</source>
          <access-date>2023-02-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hey.nhs.uk/breast-care/patient-videos">https://www.hey.nhs.uk/breast-care/patient-videos</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khanbhai</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Anyadi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Symons</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Flott</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Applying natural language processing and machine learning techniques to patient experience feedback: a systematic review</article-title>
          <source>BMJ Health Care Inform</source>
          <year>2021</year>
          <month>03</month>
          <day>02</day>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>e100262</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://informatics.bmj.com/lookup/pmidlookup?view=long&amp;pmid=33653690"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjhci-2020-100262</pub-id>
          <pub-id pub-id-type="medline">33653690</pub-id>
          <pub-id pub-id-type="pii">bmjhci-2020-100262</pub-id>
          <pub-id pub-id-type="pmcid">PMC7929894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cunningham</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wells</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Qualitative analysis of 6961 free-text comments from the first National Cancer Patient Experience Survey in Scotland</article-title>
          <source>BMJ Open</source>
          <year>2017</year>
          <month>06</month>
          <day>15</day>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>e015726</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&amp;pmid=28619780"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2016-015726</pub-id>
          <pub-id pub-id-type="medline">28619780</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2016-015726</pub-id>
          <pub-id pub-id-type="pmcid">PMC5734250</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abraham</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Deen</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>True</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>O'Neil</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Blanchard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Uddo</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Analyzing free-text survey responses: an accessible strategy for developing patient-centered programs and program evaluation</article-title>
          <source>Eval Program Plann</source>
          <year>2020</year>
          <month>03</month>
          <volume>78</volume>
          <fpage>101733</fpage>
          <pub-id pub-id-type="doi">10.1016/j.evalprogplan.2019.101733</pub-id>
          <pub-id pub-id-type="medline">31675509</pub-id>
          <pub-id pub-id-type="pii">S0149-7189(19)30183-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bohr</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Memarzadeh</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The rise of artificial intelligence in healthcare applications</article-title>
          <source>Artificial Intelligence in Healthcare</source>
          <year>2020</year>
          <publisher-loc>Cambridge, MA</publisher-loc>
          <publisher-name>Academic Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sabu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rajendra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zenonos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pope</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sebire</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Spiridou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Key</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Automatic extraction of structured information from cardiology MRI reports</article-title>
          <source>BMJ Paediatrics Open</source>
          <year>2024</year>
          <volume>7</volume>
          <issue>2</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjpaedsopen.bmj.com/content/7/Suppl_2/A27.2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjpo-2023-gosh.55</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajendran</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zenonos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Spear</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pope</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Embed wisely: an ensemble approach to predict ICD coding</article-title>
          <source>Proceedings of the International Workshops on Machine Learning and Principles and Practice of Knowledge Discovery in Databases</source>
          <year>2021</year>
          <conf-name>ECML PKDD 2021</conf-name>
          <conf-date>September 13-17, 2021</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <pub-id pub-id-type="doi">10.1007/978-3-030-93733-1_26</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kamel Boulos</surname>
              <given-names>MN</given-names>
            </name>
          </person-group>
          <article-title>Generative AI in medicine and healthcare: promises, opportunities and challenges</article-title>
          <source>Future Internet</source>
          <year>2023</year>
          <month>08</month>
          <day>24</day>
          <volume>15</volume>
          <issue>9</issue>
          <fpage>286</fpage>
          <pub-id pub-id-type="doi">10.3390/fi15090286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Khuntia</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Parameswaran</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Meyers</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Preliminary evidence of the use of generative AI in health care clinical services: systematic narrative review</article-title>
          <source>JMIR Med Inform</source>
          <year>2024</year>
          <month>03</month>
          <day>20</day>
          <volume>12</volume>
          <fpage>e52073</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2024//e52073/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/52073</pub-id>
          <pub-id pub-id-type="medline">38506918</pub-id>
          <pub-id pub-id-type="pii">v12i1e52073</pub-id>
          <pub-id pub-id-type="pmcid">PMC10993141</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eriksen</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Bakri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Boysen</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Klefter</surname>
              <given-names>ON</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Reinwaldt</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Grauslund</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Holm</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Subhi</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Generative artificial intelligence for increasing accessibility of patient information videos in ophthalmology</article-title>
          <source>AJO Int</source>
          <year>2024</year>
          <month>04</month>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>100016</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ajoint.2024.100016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>Generative AI used to create translatable paediatric care videos for LMIC hospitals</article-title>
          <source>Health Tech World</source>
          <year>2024</year>
          <month>2</month>
          <day>22</day>
          <access-date>2024-11-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.htworld.co.uk/news/ai/generative-ai-used-to-create-translatable-paediatric-care-videos-for-lmic-hospitals/">https://www.htworld.co.uk/news/ai/generative-ai-used-to-create-translatable-paediatric-care-videos-for-lmic-hospitals/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adeboye</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Tayal</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Odubanjo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Siakeu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkshaw</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Oni</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in the delivery of patient care: avatar-generated videos for patient education post breast surgery</article-title>
          <source>Eur J Surg Oncol</source>
          <year>2024</year>
          <month>05</month>
          <volume>50</volume>
          <issue>1</issue>
          <fpage>108076</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ejso.2024.108076</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bastemeijer</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Boosman</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zandbelt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Timman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>de Boer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hazelzet</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Patient experience monitor (PEM): the development of new short-form picker experience questionnaires for hospital patients with a wide range of literacy levels</article-title>
          <source>Patient Relat Outcome Meas</source>
          <year>2020</year>
          <volume>11</volume>
          <fpage>221</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33312007"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/PROM.S274015</pub-id>
          <pub-id pub-id-type="medline">33312007</pub-id>
          <pub-id pub-id-type="pii">274015</pub-id>
          <pub-id pub-id-type="pmcid">PMC7725101</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bowie</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>McNab</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>de Wet</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>MacLeod</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McKay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Quality improvement and person-centredness: a participatory mixed methods study to develop the 'always event' concept for primary care</article-title>
          <source>BMJ Open</source>
          <year>2015</year>
          <month>04</month>
          <day>28</day>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>e006667</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&amp;pmid=25922095"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2014-006667</pub-id>
          <pub-id pub-id-type="medline">25922095</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2014-006667</pub-id>
          <pub-id pub-id-type="pmcid">PMC4420967</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>Institute of Medicine (US) Committee on Quality of Health Care in America</collab>
          </person-group>
          <source>Crossing the Quality Chasm: A New Health System for the 21st Century</source>
          <year>2001</year>
          <month>08</month>
          <day>30</day>
          <publisher-loc>Washington, DC</publisher-loc>
          <publisher-name>National Academies Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Coulter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzpatrick</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cornwell</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Measures of Patients' Experience in Hospital: Purpose, Methods and Uses</source>
          <year>2009</year>
          <publisher-loc>London, UK</publisher-loc>
          <publisher-name>King's Fund</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>High Quality Care For All: NHS Next Stage Review Final Report</source>
          <year>2008</year>
          <month>6</month>
          <publisher-loc>Leeds, England</publisher-loc>
          <publisher-name>Department of Health and Social Care National Health Service</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ziebland</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Coulter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Calabrese</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Locock</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <source>Understanding and Using Health Experiences: Improving Patient Care</source>
          <year>2013</year>
          <publisher-loc>Oxford, UK</publisher-loc>
          <publisher-name>Oxford University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Vos</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Hamming</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Boosman</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Marang-van de Mheen</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>The association between complications, incidents, and patient experience: retrospective linkage of routine patient experience surveys and safety data</article-title>
          <source>J Patient Saf</source>
          <year>2021</year>
          <month>03</month>
          <day>01</day>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>e91</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1097/PTS.0000000000000581</pub-id>
          <pub-id pub-id-type="medline">30865163</pub-id>
          <pub-id pub-id-type="pii">01209203-202103000-00017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Riiskjær</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ammentorp</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kofoed</surname>
              <given-names>PE</given-names>
            </name>
          </person-group>
          <article-title>The value of open-ended questions in surveys on patient experience: number of comments and perceived usefulness from a hospital perspective</article-title>
          <source>Int J Qual Health Care</source>
          <year>2012</year>
          <month>10</month>
          <day>25</day>
          <volume>24</volume>
          <issue>5</issue>
          <fpage>509</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.1093/intqhc/mzs039</pub-id>
          <pub-id pub-id-type="medline">22833616</pub-id>
          <pub-id pub-id-type="pii">mzs039</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gallan</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Girju</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Girju</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Perfect ratings with negative comments: learning from contradictory patient survey responses</article-title>
          <source>Patient Exp J</source>
          <year>2017</year>
          <month>11</month>
          <day>06</day>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>15</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.35680/2372-0247.1234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Buchem</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Neve</surname>
              <given-names>OM</given-names>
            </name>
            <name name-style="western">
              <surname>Kant</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Boosman</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hensen</surname>
              <given-names>EF</given-names>
            </name>
          </person-group>
          <article-title>Analyzing patient experiences using natural language processing: development and validation of the artificial intelligence patient reported experience measure (AI-PREM)</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2022</year>
          <month>07</month>
          <day>15</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>183</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-022-01923-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-022-01923-5</pub-id>
          <pub-id pub-id-type="medline">35840972</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-022-01923-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC9284859</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>McAuliffe</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Supervised topic models</article-title>
          <source>Proceedings of the Advances in Neural Information Processing Systems 20</source>
          <year>2007</year>
          <conf-name>NIPS 2007</conf-name>
          <conf-date>December 3-6, 2007</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abirami</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Askarunisa</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Sentiment analysis model to emphasize the impact of online reviews in healthcare industry</article-title>
          <source>Online Inf Rev</source>
          <year>2017</year>
          <month>08</month>
          <day>14</day>
          <volume>41</volume>
          <issue>4</issue>
          <fpage>471</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.1108/OIR-08-2015-0289</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bahja</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lycett</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Identifying patient experience from online resources via sentiment analysis and topic modelling</article-title>
          <source>Proceedings of the 3rd IEEE/ACM International Conference on Big Data Computing, Applications and Technologies</source>
          <year>2016</year>
          <conf-name>BDCAT '16</conf-name>
          <conf-date>December 6-9, 2016</conf-date>
          <conf-loc>Shanghai, China</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3006299.3006335</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bracher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Corner</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wagland</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Exploring experiences of cancer care in Wales: a thematic analysis of free-text responses to the 2013 Wales Cancer Patient Experience Survey (WCPES)</article-title>
          <source>BMJ Open</source>
          <year>2016</year>
          <month>09</month>
          <day>02</day>
          <volume>6</volume>
          <issue>9</issue>
          <fpage>e011830</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&amp;pmid=27591021"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2016-011830</pub-id>
          <pub-id pub-id-type="medline">27591021</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2016-011830</pub-id>
          <pub-id pub-id-type="pmcid">PMC5020838</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Elwyn</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Experiencing patient-experience surveys: a qualitative study of the accounts of GPs</article-title>
          <source>Br J Gen Pract</source>
          <year>2011</year>
          <month>04</month>
          <day>01</day>
          <volume>61</volume>
          <issue>585</issue>
          <fpage>e157</fpage>
          <lpage>66</lpage>
          <pub-id pub-id-type="doi">10.3399/bjgp11x567072</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Varanasi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tanniru</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Seeking intelligence from patient experience using text mining: analysis of emergency department data</article-title>
          <source>Inf Syst Manag</source>
          <year>2015</year>
          <month>04</month>
          <day>28</day>
          <volume>32</volume>
          <issue>3</issue>
          <fpage>220</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1080/10580530.2015.1044342</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doing-Harris</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mowery</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Daniels</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Understanding patient satisfaction with received healthcare services: a natural language processing approach</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>524</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28269848"/>
          </comment>
          <pub-id pub-id-type="medline">28269848</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pradhan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hosseini</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kulanthaivel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hosseini</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Novel approach to cluster patient-generated data into actionable topics: case study of a web-based breast cancer forum</article-title>
          <source>JMIR Med Inform</source>
          <year>2018</year>
          <month>11</month>
          <day>29</day>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>e45</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2018/4/e45/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.9162</pub-id>
          <pub-id pub-id-type="medline">30497991</pub-id>
          <pub-id pub-id-type="pii">v6i4e45</pub-id>
          <pub-id pub-id-type="pmcid">PMC6293240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cammel</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>De Vos</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>van Soest</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hettne</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Boer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Boosman</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>How to automatically turn patient experience free-text responses into actionable insights: a natural language programming (NLP) approach</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2020</year>
          <month>05</month>
          <day>27</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>97</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-020-1104-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-020-1104-5</pub-id>
          <pub-id pub-id-type="medline">32460734</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-020-1104-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7251822</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>López</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Detz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ratanawongsa</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sarkar</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>What patients say about their doctors online: a qualitative content analysis</article-title>
          <source>J Gen Intern Med</source>
          <year>2012</year>
          <month>06</month>
          <day>4</day>
          <volume>27</volume>
          <issue>6</issue>
          <fpage>685</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22215270"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-011-1958-4</pub-id>
          <pub-id pub-id-type="medline">22215270</pub-id>
          <pub-id pub-id-type="pmcid">PMC3358396</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greaves</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez-Cano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Millett</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Donaldson</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Use of sentiment analysis for capturing patient experience from free-text comments posted online</article-title>
          <source>J Med Internet Res</source>
          <year>2013</year>
          <month>11</month>
          <day>01</day>
          <volume>15</volume>
          <issue>11</issue>
          <fpage>e239</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2013/11/e239/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.2721</pub-id>
          <pub-id pub-id-type="medline">24184993</pub-id>
          <pub-id pub-id-type="pii">v15i11e239</pub-id>
          <pub-id pub-id-type="pmcid">PMC3841376</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nawab</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ramsey</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schreiber</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing to extract meaningful information from patient experience feedback</article-title>
          <source>Appl Clin Inform</source>
          <year>2020</year>
          <month>03</month>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>242</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32236917"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0040-1708049</pub-id>
          <pub-id pub-id-type="medline">32236917</pub-id>
          <pub-id pub-id-type="pmcid">PMC7113005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rohil</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Magotra</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>An exploratory study of automatic text summarization in biomedical and healthcare domain</article-title>
          <source>Healthc Anal</source>
          <year>2022</year>
          <month>11</month>
          <volume>2</volume>
          <fpage>100058</fpage>
          <pub-id pub-id-type="doi">10.1016/j.health.2022.100058</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thirunavukarasu</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Elangovan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Large language models in medicine</article-title>
          <source>Nat Med</source>
          <year>2023</year>
          <month>08</month>
          <day>17</day>
          <volume>29</volume>
          <issue>8</issue>
          <fpage>1930</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-023-02448-8</pub-id>
          <pub-id pub-id-type="medline">37460753</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-023-02448-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tariq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fathizadeh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ramaswamy</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Trivedi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Urooj</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Stib</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Patient centric summarization of radiology findings using large language models</article-title>
          <source>medRxiv. Preprint posted online on February 05, 2024</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.medrxiv.org/content/10.1101/2024.02.01.24302145v1.full"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2024.02.01.24302145</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Veen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Van Uden</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Blankemeier</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Delbrouck</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Aali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bluethgen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pareek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Polacin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Reis</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>Seehofnerová</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rohatgi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hosamani</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ahuja</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Langlotz</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Hom</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gatidis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pauly</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhari</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Clinical text summarization: adapting large language models can outperform human experts</article-title>
          <source>Res Sq</source>
          <year>2023</year>
          <month>10</month>
          <day>30</day>
          <fpage>rs.3.rs-3483777</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37961377"/>
          </comment>
          <pub-id pub-id-type="doi">10.21203/rs.3.rs-3483777/v1</pub-id>
          <pub-id pub-id-type="medline">37961377</pub-id>
          <pub-id pub-id-type="pii">rs.3.rs-3483777</pub-id>
          <pub-id pub-id-type="pmcid">PMC10635391</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bird</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Loper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Natural Language Processing with Python</source>
          <year>2009</year>
          <publisher-loc>Sebastopol, CA</publisher-loc>
          <publisher-name>O'Reilly Media</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hutto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>VADER: a parsimonious rule-based model for sentiment analysis of social media text</article-title>
          <source>Proc Int AAAI Conf Web Soc Media</source>
          <year>2014</year>
          <month>05</month>
          <day>16</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>216</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1609/icwsm.v8i1.14550</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loureiro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Barbieri</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Neves</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Anke</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Camacho-Collados</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>TimeLMs: diachronic language models from Twitter</article-title>
          <source>Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics: System Demonstrations</source>
          <year>2022</year>
          <conf-name>ACL 2022</conf-name>
          <conf-date>May 22–27, 2022</conf-date>
          <conf-loc>Dublin, Ireland</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2022.acl-demo.25</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Řehůřek</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sojka</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Software framework for topic modelling with large corpora</article-title>
          <source>Proceedings of the LREC 2010 Workshop on New Challenges for NLP Frameworks</source>
          <year>2010</year>
          <conf-name>LREC 2010</conf-name>
          <conf-date>May 17-23, 2010</conf-date>
          <conf-loc>Valletta, Malta</conf-loc>
          <pub-id pub-id-type="doi">10.13140/2.1.2393.1847</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grootendorst</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>BERTopic: neural topic modeling with a class-based TF-IDF procedure</article-title>
          <source>arXiv. Preprint posted online on March 11, 2022</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2203.05794"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Grieser</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Baldwin</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Automatic evaluation of topic coherence</article-title>
          <source>Proceedings of the Human Language Technologies: The 2010 Annual Conference of the North American Chapter of the Association for Computational Linguistics</source>
          <year>2010</year>
          <conf-name>HLT '10</conf-name>
          <conf-date>June 2-4, 2010</conf-date>
          <conf-loc>Los Angeles, CA</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grootendorst</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>KeyBERT: minimal keyword extraction with BERT</article-title>
          <source>GitHub</source>
          <access-date>2024-07-17</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/MaartenGr/KeyBERT">https://github.com/MaartenGr/KeyBERT</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Healy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Saul</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Großberger</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>UMAP: uniform manifold approximation and projection</article-title>
          <source>J Open Source Softw</source>
          <year>2018</year>
          <month>09</month>
          <day>02</day>
          <volume>3</volume>
          <issue>29</issue>
          <fpage>861</fpage>
          <pub-id pub-id-type="doi">10.21105/joss.00861</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Healy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Melville</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>UMAP: uniform manifold approximation and projection for dimension reduction</article-title>
          <source>arXiv. Preprint posted online on February 09, 2018</source>
          <year>2025</year>
          <pub-id pub-id-type="doi">10.48550/arXiv.1802.03426</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nothman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Louppe</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Prettenhofer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubourg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderplas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Passos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cournapeau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brucher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Perrot</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duchesnay</surname>
              <given-names>É</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in python</article-title>
          <source>arXiv. Preprint posted online on January 02, 2012</source>
          <year>2025</year>
          <pub-id pub-id-type="doi">10.48550/arXiv.1201.0490</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Wordcloud</article-title>
          <source>Zenodo</source>
          <year>2024</year>
          <access-date>2024-07-17</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://zenodo.org/records/14062883">https://zenodo.org/records/14062883</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sallam</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT utility in healthcare education, research, and practice: systematic review on the promising perspectives and valid concerns</article-title>
          <source>Healthcare (Basel)</source>
          <year>2023</year>
          <month>03</month>
          <day>19</day>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>887</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=healthcare11060887"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/healthcare11060887</pub-id>
          <pub-id pub-id-type="medline">36981544</pub-id>
          <pub-id pub-id-type="pii">healthcare11060887</pub-id>
          <pub-id pub-id-type="pmcid">PMC10048148</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Saleh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>PEGASUS: pre-training with extracted gap-sentences for abstractive summarization</article-title>
          <source>arXiv. Preprint posted online on December 18, 2019</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1912.08777"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1912.08777</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Child</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Luan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Amodei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Language models are unsupervised multitask learners</article-title>
          <source>OpenAI</source>
          <year>2019</year>
          <access-date>2024-07-17</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.bibsonomy.org/bibtex/1b926ece39c03cdf5499f6540cf63babd">https://www.bibsonomy.org/bibtex/1b926ece39c03cdf5499f6540cf63babd</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ghazvininejad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mohamed</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Stoyanov</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Zettlemoyer</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>BART: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension</article-title>
          <source>Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics</source>
          <year>2020</year>
          <conf-name>ACL 2020</conf-name>
          <conf-date>July 5-10, 2020</conf-date>
          <conf-loc>Online</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2020.acl-main.703</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raffel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shazeer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Narang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matena</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>Exploring the limits of transfer learning with a unified text-to-text transformer</article-title>
          <source>arXiv. Preprint posted online on October 23, 2019</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1910.10683"/>
          </comment>
          <pub-id pub-id-type="doi">10.5260/chara.21.2.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Longpre</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zoph</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tay</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fedus</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Dehghani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brahma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Webson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Suzgun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chowdhery</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Castro-Ros</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pellat</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Valter</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Narang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mishra</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Petrov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>QV</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scaling instruction-finetuned language models</article-title>
          <source>arXiv. Preprint posted online on October 20, 2022</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2210.11416"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Debut</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sanh</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chaumond</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Delangue</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Moi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cistac</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rault</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Louf</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Funtowicz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shleifer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>von Platen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jernite</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Plu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scao</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Gugger</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Drame</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lhoest</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Rush</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Transformers: state-of-the-art natural language processing</article-title>
          <source>Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations</source>
          <year>2020</year>
          <conf-name>EMNLP 2020</conf-name>
          <conf-date>November 16-20, 2020</conf-date>
          <conf-loc>Online</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2020.emnlp-demos.6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="web">
          <article-title>Is it research?</article-title>
          <source>Hull University Teaching Hospitals NHS Trust</source>
          <access-date>2025-05-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hey.nhs.uk/research/researchers/">https://www.hey.nhs.uk/research/researchers/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="web">
          <article-title>Defining research table</article-title>
          <source>Health Research Authority</source>
          <year>2022</year>
          <access-date>2025-05-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hra-decisiontools.org.uk/research/docs/DefiningResearchTable_Oct2022.pdf">https://www.hra-decisiontools.org.uk/research/docs/DefiningResearchTable_Oct2022.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anandaciva</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The reshaping of NHS national bodies has only just started. How will it finish?</article-title>
          <source>The King's Fund</source>
          <year>2025</year>
          <month>3</month>
          <day>13</day>
          <access-date>2025-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kingsfund.org.uk/insight-and-analysis/blogs/reshaping-nhs-national-bodies-started-finish">https://www.kingsfund.org.uk/insight-and-analysis/blogs/reshaping-nhs-national-bodies-started-finish</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alemi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Torii</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clementz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aron</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>Feasibility of real-time satisfaction surveys through automated analysis of patients' unstructured comments and sentiments</article-title>
          <source>Qual Manag Health Care</source>
          <year>2012</year>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>9</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1097/QMH.0b013e3182417fc4</pub-id>
          <pub-id pub-id-type="medline">22207014</pub-id>
          <pub-id pub-id-type="pii">00019514-201201000-00004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="web">
          <article-title>Delivery plan for tackling the COVID-19 backlog of elective care</article-title>
          <source>National Health Service England</source>
          <year>2022</year>
          <access-date>2024-04-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.england.nhs.uk/coronavirus/publication/delivery-plan-for-tackling-the-covid-19-backlog-of-elective-care/">https://www.england.nhs.uk/coronavirus/publication/delivery-plan-for-tackling-the-covid-19-backlog-of-elective-care/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Payerchin</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Survey shows patient mistrust of AI use in health care</article-title>
          <source>Urology Times</source>
          <year>2023</year>
          <month>10</month>
          <day>17</day>
          <access-date>2025-04-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.urologytimes.com/view/survey-shows-patient-mistrust-of-ai-use-in-health-care">https://www.urologytimes.com/view/survey-shows-patient-mistrust-of-ai-use-in-health-care</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lekadir</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Frangi</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Porras</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Glocker</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Cintas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Langlotz</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Weicken</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Asselbergs</surname>
              <given-names>FW</given-names>
            </name>
            <name name-style="western">
              <surname>Prior</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Kaissis</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tsakou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Buvat</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kalpathy-Cramer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mongan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schnabel</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Kushibar</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Riklund</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Marias</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Amugongo</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Fromont</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Maier-Hein</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cerdá-Alberich</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Martí-Bonmatí</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cardoso</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bobowicz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shabani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tsiknakis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zuluaga</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Fritzsche</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Camacho</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Linguraru</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Wenzel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>De Bruijne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tolsgaard</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Goisauf</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cano Abadía</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Papanikolaou</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lazrak</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pujol</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Osuala</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Napel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Colantonio</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Joshi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aussó</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Salahuddin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Starmans</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>FUTURE-AI: international consensus guideline for trustworthy and deployable artificial intelligence in healthcare</article-title>
          <source>BMJ</source>
          <year>2025</year>
          <month>02</month>
          <day>05</day>
          <volume>388</volume>
          <fpage>e081554</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.bmj.com/lookup/pmidlookup?view=long&amp;pmid=39909534"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj-2024-081554</pub-id>
          <pub-id pub-id-type="medline">39909534</pub-id>
          <pub-id pub-id-type="pmcid">PMC11795397</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Monteith</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Glenn</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Geddes</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Whybrow</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Achtyes</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence and increasing misinformation</article-title>
          <source>Br J Psychiatry</source>
          <year>2024</year>
          <month>02</month>
          <volume>224</volume>
          <issue>2</issue>
          <fpage>33</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1192/bjp.2023.136</pub-id>
          <pub-id pub-id-type="medline">37881016</pub-id>
          <pub-id pub-id-type="pii">S0007125023001368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Menz</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Modi</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Sorich</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Health disinformation use case highlighting the urgent need for artificial intelligence vigilance: weapons of mass disinformation</article-title>
          <source>JAMA Intern Med</source>
          <year>2024</year>
          <month>01</month>
          <day>01</day>
          <volume>184</volume>
          <issue>1</issue>
          <fpage>92</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2023.5947</pub-id>
          <pub-id pub-id-type="medline">37955873</pub-id>
          <pub-id pub-id-type="pii">2811333</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stokel-Walker</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Deepfakes and doctors: how people are being fooled by social media scams</article-title>
          <source>BMJ</source>
          <year>2024</year>
          <month>07</month>
          <day>17</day>
          <volume>386</volume>
          <fpage>q1319</fpage>
          <pub-id pub-id-type="doi">10.1136/bmj.q1319</pub-id>
          <pub-id pub-id-type="medline">39019557</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Swartz</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>How people are being tricked by deepfake doctor videos on social media</article-title>
          <source>New York Post</source>
          <year>2024</year>
          <month>7</month>
          <day>17</day>
          <access-date>2025-04-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://nypost.com/2024/07/17/health/how-people-are-being-tricked-by-deepfake-doctor-videos/">https://nypost.com/2024/07/17/health/how-people-are-being-tricked-by-deepfake-doctor-videos/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Given</surname>
              <given-names>LM</given-names>
            </name>
          </person-group>
          <article-title>Generative AI and deepfakes are fuelling health misinformation. Here’s what to look out for so you don’t get scammed</article-title>
          <source>The Conversation</source>
          <year>2025</year>
          <month>3</month>
          <day>13</day>
          <access-date>2025-04-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://theconversation.com/generative-ai-and-deepfakes-are-fuelling-health-misinformation-heres-what-to-look-out-for-so-you-dont-get-scammed-246149">https://theconversation.com/generative-ai-and-deepfakes-are-fuelling-health-misinformation-heres-what-to-look-out-for-so-you-dont-get-scammed-246149</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rudd</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Oppenheimer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nath</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>Health Literacy: An Update of Medical and Public Health Literature</source>
          <year>2007</year>
          <publisher-loc>Milton Park, UK</publisher-loc>
          <publisher-name>Routledge</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Okuhara</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ishikawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ueno</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Okada</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kato</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kiuchi</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Readability assessment of vaccine information: a systematic review for addressing vaccine hesitancy</article-title>
          <source>Patient Educ Couns</source>
          <year>2022</year>
          <month>02</month>
          <volume>105</volume>
          <issue>2</issue>
          <fpage>331</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pec.2021.05.039</pub-id>
          <pub-id pub-id-type="medline">34090717</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(21)00395-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdullah</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Alokozai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connell</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mulcahey</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Online patient education materials for common sports injuries are written at too-high of a reading level: a systematic review</article-title>
          <source>Arthrosc Sports Med Rehabil</source>
          <year>2022</year>
          <month>06</month>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>e861</fpage>
          <lpage>75</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2666-061X(21)00283-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.asmr.2021.12.017</pub-id>
          <pub-id pub-id-type="medline">35747648</pub-id>
          <pub-id pub-id-type="pii">S2666-061X(21)00283-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC9210373</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Okuhara</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Furukawa</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Okada</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yokota</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kiuchi</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Readability of written information for patients across 30 years: a systematic review of systematic reviews</article-title>
          <source>Patient Educ Couns</source>
          <year>2025</year>
          <month>06</month>
          <volume>135</volume>
          <fpage>108656</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0738-3991(25)00023-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2025.108656</pub-id>
          <pub-id pub-id-type="medline">40068244</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(25)00023-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="web">
          <article-title>AI video translator</article-title>
          <source>Synthesia</source>
          <access-date>2025-05-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.synthesia.io/features/video-translator">https://www.synthesia.io/features/video-translator</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="web">
          <article-title>National patient information video library added to nhs.uk homepage</article-title>
          <source>National Health Service Torbay and South Devon NHS Foundation Trust</source>
          <year>2021</year>
          <month>2</month>
          <day>2</day>
          <access-date>2024-08-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.torbayandsouthdevon.nhs.uk/about-us/news-and-publications/news/2021/02/national-patient-information-video-library-added-to-nhs-uk-20637/">https://www.torbayandsouthdevon.nhs.uk/about-us/news-and-publications/news/2021/02/national-patient-information-video-library-added-to-nhs-uk-20637/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Hung</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Clinician-created educational video for shared decision-making in the outpatient management of acne</article-title>
          <source>PLoS One</source>
          <year>2022</year>
          <month>7</month>
          <day>8</day>
          <volume>17</volume>
          <issue>7</issue>
          <fpage>e0271100</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0271100"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0271100</pub-id>
          <pub-id pub-id-type="medline">35802643</pub-id>
          <pub-id pub-id-type="pii">PONE-D-22-09574</pub-id>
          <pub-id pub-id-type="pmcid">PMC9269380</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mbanda</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dada</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bastable</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ingalill</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Ralf</surname>
              <given-names>WS</given-names>
            </name>
          </person-group>
          <article-title>A scoping review of the use of visual aids in health education materials for persons with low-literacy levels</article-title>
          <source>Patient Educ Couns</source>
          <year>2021</year>
          <month>05</month>
          <volume>104</volume>
          <issue>5</issue>
          <fpage>998</fpage>
          <lpage>1017</lpage>
          <pub-id pub-id-type="doi">10.1016/j.pec.2020.11.034</pub-id>
          <pub-id pub-id-type="medline">33339657</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(20)30658-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wiebe</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Recognizing contextual polarity in phrase-level sentiment analysis</article-title>
          <source>Proceedings of the Conference on Human Language Technology and Empirical Methods in Natural Language Processing</source>
          <year>2005</year>
          <conf-name>HLT '05</conf-name>
          <conf-date>October 6-8, 2005</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
          <pub-id pub-id-type="doi">10.3115/1220575.1220619</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Quteineh</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Samothrakis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sutcliffe</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Textual data augmentation for efficient active learning on tiny datasets</article-title>
          <source>Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2020</year>
          <conf-name>EMNLP 2020</conf-name>
          <conf-date>November 16-20, 2020</conf-date>
          <conf-loc>Online</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/2020.emnlp-main.600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mnasri</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Text augmentation for Machine Learning tasks: how to grow your text dataset for classification?</article-title>
          <source>Medium</source>
          <year>2019</year>
          <month>1</month>
          <day>18</day>
          <access-date>2025-04-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medium.com/opla/text-augmentation-for-machine-learning-tasks-how-to-grow-your-text-dataset-for-classification-38a9a207f88d">https://medium.com/opla/text-augmentation-for-machine-learning-tasks-how-to-grow-your-text-dataset-for-classification-38a9a207f88d</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Shu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>An intelligent system for classifying patient complaints using machine learning and natural language processing: development and validation study</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>01</month>
          <day>08</day>
          <volume>27</volume>
          <fpage>e55721</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e55721/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/55721</pub-id>
          <pub-id pub-id-type="medline">39778195</pub-id>
          <pub-id pub-id-type="pii">v27i1e55721</pub-id>
          <pub-id pub-id-type="pmcid">PMC11754990</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kroehne</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Merk</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Improving and analyzing open-ended survey responses: a case study linking psychological theories and analysis approaches for text data</article-title>
          <source>Zeitschrift für Psychologie</source>
          <year>2024</year>
          <month>07</month>
          <volume>232</volume>
          <issue>3</issue>
          <fpage>171</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.1027/2151-2604/a000566</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Booker</surname>
              <given-names>QS</given-names>
            </name>
            <name name-style="western">
              <surname>Austin</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Balasubramanian</surname>
              <given-names>BA</given-names>
            </name>
          </person-group>
          <article-title>Survey strategies to increase participant response rates in primary care research studies</article-title>
          <source>Fam Pract</source>
          <year>2021</year>
          <month>09</month>
          <day>25</day>
          <volume>38</volume>
          <issue>5</issue>
          <fpage>699</fpage>
          <lpage>702</lpage>
          <pub-id pub-id-type="doi">10.1093/fampra/cmab070</pub-id>
          <pub-id pub-id-type="medline">34213547</pub-id>
          <pub-id pub-id-type="pii">6313102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pranay Kumar</surname>
              <given-names>BV</given-names>
            </name>
            <name name-style="western">
              <surname>Sadanandam</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A fusion architecture of BERT and RoBERTa for enhanced performance of sentiment analysis of social media platforms</article-title>
          <source>SSRN. Preprint posted online on May 27, 2023</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://papers.ssrn.com/sol3/papers.cfm?abstract_id=4455231"/>
          </comment>
          <pub-id pub-id-type="doi">10.2139/ssrn.4455231</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hua</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wicker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Taskova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of aspect-based sentiment analysis: domains, methods, and trends</article-title>
          <source>Artif Intell Rev</source>
          <year>2024</year>
          <month>09</month>
          <day>17</day>
          <volume>57</volume>
          <fpage>296</fpage>
          <pub-id pub-id-type="doi">10.1007/s10462-024-10906-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="web">
          <article-title>Guidance: the Caldicott principles</article-title>
          <source>National Data Guardian</source>
          <year>2020</year>
          <access-date>2025-04-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.gov.uk/government/publications/the-caldicott-principles">https://www.gov.uk/government/publications/the-caldicott-principles</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Helen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fargotstein</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Importance of response rates</article-title>
          <source>The SAGE Encyclopedia of Communication Research Methods: Survey Response Rates</source>
          <year>2008</year>
          <publisher-loc>Thousand Oaks, CA</publisher-loc>
          <publisher-name>SAGE Publications</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hibbard</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Stockard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mahoney</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Tusler</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Development of the Patient Activation Measure (PAM): conceptualizing and measuring activation in patients and consumers</article-title>
          <source>Health Serv Res</source>
          <year>2004</year>
          <month>08</month>
          <volume>39</volume>
          <issue>4 Pt 1</issue>
          <fpage>1005</fpage>
          <lpage>26</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/15230939"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1475-6773.2004.00269.x</pub-id>
          <pub-id pub-id-type="medline">15230939</pub-id>
          <pub-id pub-id-type="pii">HESR269</pub-id>
          <pub-id pub-id-type="pmcid">PMC1361049</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Compton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Glass</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fowler</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Evidence of selection bias and non-response bias in patient satisfaction surveys</article-title>
          <source>Iowa Orthop J</source>
          <year>2019</year>
          <volume>39</volume>
          <issue>1</issue>
          <fpage>195</fpage>
          <lpage>201</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31413694"/>
          </comment>
          <pub-id pub-id-type="medline">31413694</pub-id>
          <pub-id pub-id-type="pmcid">PMC6604521</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="web">
          <article-title>Facts and figures</article-title>
          <source>Breast Cancer UK</source>
          <access-date>2025-04-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.breastcanceruk.org.uk/about-breast-cancer/facts-figures-and-qas/facts-and-figures/">https://www.breastcanceruk.org.uk/about-breast-cancer/facts-figures-and-qas/facts-and-figures/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref97">
        <label>97</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nazroo</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Understanding digital engagement in later life</article-title>
          <source>United Kingdom Government</source>
          <year>2015</year>
          <month>5</month>
          <access-date>2025-04-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://assets.publishing.service.gov.uk/media/5a81a1e2e5274a2e8ab5508b/FullReport-UnderstandingDigitalEngagementinLaterLife.docx.pdf">https://assets.publishing.service.gov.uk/media/5a81a1e2e5274a2e8ab5508b/FullReport-UnderstandingDigitalEngagementinLaterLife.docx.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref98">
        <label>98</label>
        <nlm-citation citation-type="web">
          <article-title>Offline and overlooked</article-title>
          <source>Age UK</source>
          <access-date>2025-04-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ageuk.org.uk/our-impact/campaigning/offline-overlooked/">https://www.ageuk.org.uk/our-impact/campaigning/offline-overlooked/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref99">
        <label>99</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boscardin</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzales</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The impact of demographic characteristics on nonresponse in an ambulatory patient satisfaction survey</article-title>
          <source>Jt Comm J Qual Patient Saf</source>
          <year>2013</year>
          <month>03</month>
          <volume>39</volume>
          <issue>3</issue>
          <fpage>123</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1016/s1553-7250(13)39018-7</pub-id>
          <pub-id pub-id-type="medline">23516762</pub-id>
          <pub-id pub-id-type="pii">S1553-7250(13)39018-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref100">
        <label>100</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Abdollahi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Multi-label classification of short texts with label correlated recurrent neural networks</article-title>
          <source>Proceedings of the 2021 ACM SIGIR International Conference on Theory of Information Retrieval</source>
          <year>2021</year>
          <conf-name>ICTIR '21</conf-name>
          <conf-date>July 11, 2021</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3471158.3472246</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref101">
        <label>101</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carrera-Trejo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Sidorov</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Miranda-Jiménez</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno Ibarra</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cadena Martínez</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Latent dirichlet allocation complement in the vector space model for multi-label text classification</article-title>
          <source>Int J Comb Optim Probl Informatics</source>
          <year>2015</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>7</fpage>
          <lpage>19</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ijcopi.org/ojs/article/view/58"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref102">
        <label>102</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>How do general-purpose sentiment analyzers perform when applied to health-related online social media data?</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <month>08</month>
          <day>21</day>
          <volume>264</volume>
          <fpage>1208</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31438117"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/SHTI190418</pub-id>
          <pub-id pub-id-type="medline">31438117</pub-id>
          <pub-id pub-id-type="pii">SHTI190418</pub-id>
          <pub-id pub-id-type="pmcid">PMC8061710</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref103">
        <label>103</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Osváth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>ZG</given-names>
            </name>
            <name name-style="western">
              <surname>Kósa</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Analyzing narratives of patient experiences: a BERT topic modeling approach</article-title>
          <source>Acta Polytech Hung</source>
          <year>2023</year>
          <volume>20</volume>
          <issue>7</issue>
          <fpage>153</fpage>
          <lpage>71</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://acta.uni-obuda.hu/Osvath_Yang_Kosa_136.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.12700/APH.20.7.2023.7.9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref104">
        <label>104</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chatzimina</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Papadaki</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Pontikoglou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tsiknakis</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A comparative sentiment analysis of Greek clinical conversations using BERT, RoBERTa, GPT-2, and XLNet</article-title>
          <source>Bioengineering (Basel)</source>
          <year>2024</year>
          <month>05</month>
          <day>21</day>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>521</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=bioengineering11060521"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/bioengineering11060521</pub-id>
          <pub-id pub-id-type="medline">38927757</pub-id>
          <pub-id pub-id-type="pii">bioengineering11060521</pub-id>
          <pub-id pub-id-type="pmcid">PMC11200492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref105">
        <label>105</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sarkar</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Trikalinos</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A large-scale quantitative analysis of latent factors and sentiment in online doctor reviews</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2014</year>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>1098</fpage>
          <lpage>103</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24918109"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2014-002711</pub-id>
          <pub-id pub-id-type="medline">24918109</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2014-002711</pub-id>
          <pub-id pub-id-type="pmcid">PMC4215053</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref106">
        <label>106</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoyle</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Peskov</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hian-Cheong</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd-Graber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Resnik</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Is automated topic model evaluation broken?: the incoherence of coherence</article-title>
          <source>arXiv. Preprint posted online on July 5, 2021</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2107.02173"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2107.02173</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref107">
        <label>107</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gerrish</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd-graber</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Reading tea leaves: how humans interpret topic models</article-title>
          <source>Proceedings of the Advances in Neural Information Processing Systems 22</source>
          <year>2009</year>
          <conf-name>NIPS 2009</conf-name>
          <conf-date>December 7-10, 2009</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://proceedings.neurips.cc/paper_files/paper/2009/file/f92586a25bb3145facd64ab20fd554ff-Paper.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref108">
        <label>108</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Baldwin</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Machine reading tea leaves: automatically evaluating topic coherence and topic model quality</article-title>
          <source>Proceedings of the 14th Conference of the European Chapter of the Association for Computational Linguistics</source>
          <year>2014</year>
          <conf-name>EACL 2014</conf-name>
          <conf-date>April 26-30, 2014</conf-date>
          <conf-loc>Gothenburg, Sweden</conf-loc>
          <pub-id pub-id-type="doi">10.3115/v1/e14-1056</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref109">
        <label>109</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhatia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Baldwin</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Topic intrusion for automatic topic model evaluation</article-title>
          <source>Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2018</year>
          <conf-name>EMNLP 2018</conf-name>
          <conf-date>October 31-November 4, 2018</conf-date>
          <conf-loc>Brussels, Belgium</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/d18-1098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref110">
        <label>110</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Egger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A topic modeling comparison between LDA, NMF, Top2Vec, and BERTopic to demystify Twitter posts</article-title>
          <source>Front Sociol</source>
          <year>2022</year>
          <month>5</month>
          <day>6</day>
          <volume>7</volume>
          <fpage>886498</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35602001"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fsoc.2022.886498</pub-id>
          <pub-id pub-id-type="medline">35602001</pub-id>
          <pub-id pub-id-type="pmcid">PMC9120935</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref111">
        <label>111</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steele</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fairie</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kemp</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>D'Souza</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Wilms</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Santana</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Identifying patient-reported care experiences in free-text survey comments: topic modeling study</article-title>
          <source>JMIR Med Inform</source>
          <year>2025</year>
          <month>02</month>
          <day>24</day>
          <volume>13</volume>
          <fpage>e63466</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2025//e63466/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/63466</pub-id>
          <pub-id pub-id-type="medline">39993226</pub-id>
          <pub-id pub-id-type="pii">v13i1e63466</pub-id>
          <pub-id pub-id-type="pmcid">PMC11875393</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref112">
        <label>112</label>
        <nlm-citation citation-type="web">
          <article-title>GP Patient Survey homepage</article-title>
          <source>GP Patient Survey</source>
          <access-date>2024-02-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.gp-patient.co.uk/">https://www.gp-patient.co.uk/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref113">
        <label>113</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Beech</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Alderwick</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Price</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ansari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon-Woods</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sinnott</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Rethinking access to general practice: it’s not all about supply</article-title>
          <source>The Health Foundation</source>
          <year>2024</year>
          <month>3</month>
          <day>5</day>
          <access-date>2025-04-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.health.org.uk/sites/default/files/pdf/2024-03/Rethinking%20access%20to%20general%20practice_0.pdf">https://www.health.org.uk/sites/default/files/pdf/2024-03/Rethinking%20access%20to%20general%20practice_0.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref114">
        <label>114</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aggarwal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>van der Meulen</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>"Shopping around" for treatment is not a solution to cancer backlog</article-title>
          <source>BMJ</source>
          <year>2022</year>
          <month>10</month>
          <day>10</day>
          <volume>379</volume>
          <fpage>e071967</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.bmj.com/lookup/pmidlookup?view=long&amp;pmid=36216385"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj-2022-071967</pub-id>
          <pub-id pub-id-type="medline">36216385</pub-id>
          <pub-id pub-id-type="pmcid">PMC9619362</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref115">
        <label>115</label>
        <nlm-citation citation-type="web">
          <article-title>Over 2 million people in backlog for cancer care</article-title>
          <source>Cancer Research UK</source>
          <year>2020</year>
          <month>6</month>
          <day>1</day>
          <access-date>2023-11-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://news.cancerresearchuk.org/2020/06/01/over-2-million-people-in-backlog-for-cancer-care/">https://news.cancerresearchuk.org/2020/06/01/over-2-million-people-in-backlog-for-cancer-care/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref116">
        <label>116</label>
        <nlm-citation citation-type="web">
          <article-title>Clearing the path to diagnosis: improving referral pathways in England for people with secondary breast cancer</article-title>
          <source>Breast Cancer Now</source>
          <access-date>2022-10-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://breastcancernow.org/media-assets/y3xahjbq/nss-pathway-report.pdf">https://breastcancernow.org/media-assets/y3xahjbq/nss-pathway-report.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref117">
        <label>117</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>CY</given-names>
            </name>
          </person-group>
          <article-title>ROUGE: a package for automatic evaluation of summaries</article-title>
          <source>Proceedings of the ACL Workshop: Text Summarization Braches Out 2004</source>
          <year>2004</year>
          <conf-name>ACL 2004</conf-name>
          <conf-date>July 21-26, 2004</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/W04-1013/"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref118">
        <label>118</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A systematic survey of text summarization: from statistical methods to large language models</article-title>
          <source>ACM Comput Surv</source>
          <year>2025</year>
          <month>04</month>
          <day>19</day>
          <pub-id pub-id-type="doi">10.1145/3731445</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref119">
        <label>119</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pobbathi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A comparative study of quality evaluation methods for text summarization</article-title>
          <source>arXiv. Preprint posted online on June 30, 2024</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2407.00747"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2407.00747</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref120">
        <label>120</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>GPTScore: evaluate as you desire</article-title>
          <source>arXiv. Preprint posted online on February 8, 2023</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2302.04166"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2024.naacl-long.365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref121">
        <label>121</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bahrainian</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Mercurio</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Eickhoff</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Neural summarization of electronic health records</article-title>
          <source>arXiv. Preprint posted online on May 24, 2023</source>
          <year>2025</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2305.15222"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/preprints.49544</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
