<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e55721</article-id>
      <article-id pub-id-type="pmid">39778195</article-id>
      <article-id pub-id-type="doi">10.2196/55721</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>An Intelligent System for Classifying Patient Complaints Using Machine Learning and Natural Language Processing: Development and Validation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Coristine</surname>
            <given-names>Andrew</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Liang</surname>
            <given-names>Jun</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Elbattah</surname>
            <given-names>Mahmoud</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sure</surname>
            <given-names>Tharun Anand Reddy</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Vakharia</surname>
            <given-names>Vinay</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Xiadong</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9956-9111</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Shu</surname>
            <given-names>Qiang</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4106-6255</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Kong</surname>
            <given-names>Canhong</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-4007-7494</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Jinhu</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7749-2475</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Gang</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-2069-5056</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Fang</surname>
            <given-names>Xin</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-7593-1649</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Lou</surname>
            <given-names>Xiaomin</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-0645-2888</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>Gang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Children's Hospital</institution>
            <institution>Zhejiang University School of Medicine</institution>
            <institution>National Clinical Research Center For Child Health</institution>
            <addr-line>No. 3333, Binsheng Road, Binjiang District, Hangzhou</addr-line>
            <addr-line>Hang Zhou, 310020</addr-line>
            <country>China</country>
            <phone>86 13588773370</phone>
            <email>yugbme@zju.edu.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9935-9969</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Children's Hospital</institution>
        <institution>Zhejiang University School of Medicine</institution>
        <institution>National Clinical Research Center For Child Health</institution>
        <addr-line>Hang Zhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Patient Service Surveillance Office</institution>
        <institution>Medical Information Department</institution>
        <institution>Hangzhou Red Cross Hospital</institution>
        <addr-line>Hang Zhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Radiation Oncology</institution>
        <institution>Zhe Jiang Xiaoshan hospital</institution>
        <institution>Hangzhou Normal University</institution>
        <addr-line>Hang Zhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Hospital Management Office</institution>
        <institution>Hangzhou Cancer Hospital</institution>
        <addr-line>Hang Zhou</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Patient Service Surveillance Office</institution>
        <institution>Hangzhou Red Cross Hospital</institution>
        <addr-line>Hang Zhou</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Gang Yu <email>yugbme@zju.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>8</day>
        <month>1</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e55721</elocation-id>
      <history>
        <date date-type="received">
          <day>21</day>
          <month>12</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>12</day>
          <month>3</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>28</day>
          <month>4</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>4</day>
          <month>11</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Xiadong Li, Qiang Shu, Canhong Kong, Jinhu Wang, Gang Li, Xin Fang, Xiaomin Lou, Gang Yu. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 08.01.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e55721" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Accurate classification of patient complaints is crucial for enhancing patient satisfaction management in health care settings. Traditional manual methods for categorizing complaints often lack efficiency and precision. Thus, there is a growing demand for advanced and automated approaches to streamline the classification process.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to develop and validate an intelligent system for automatically classifying patient complaints using machine learning (ML) and natural language processing (NLP) techniques.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>An ML-based NLP technology was proposed to extract frequently occurring dissatisfactory words related to departments, staff, and key treatment procedures. A dataset containing 1465 complaint records from 2019 to 2023 was used for training and validation, with an additional 376 complaints from Hangzhou Cancer Hospital serving as an external test set. Complaints were categorized into 4 types—communication problems, diagnosis and treatment issues, management problems, and sense of responsibility concerns. The imbalanced data were balanced using the Synthetic Minority Oversampling Technique (SMOTE) algorithm to ensure equal representation across all categories. A total of 3 ML algorithms (Multifactor Logistic Regression, Multinomial Naive Bayes, and Support Vector Machines [SVM]) were used for model training and validation. The best-performing model was tested using a 5-fold cross-validation on external data.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The original dataset consisted of 719, 376, 260, and 86 records for communication problems, diagnosis and treatment issues, management problems, and sense of responsibility concerns, respectively. The Multifactor Logistic Regression and SVM models achieved weighted average accuracies of 0.89 and 0.93 in the training set, and 0.83 and 0.87 in the internal test set, respectively. Ngram-level term frequency–inverse document frequency did not significantly improve classification performance, with only a marginal 1% increase in precision, recall, and <italic>F</italic><sub>1</sub>-score when implementing Ngram-level term frequency–inverse document frequency (n=2) from 0.91 to 0.92. The SVM algorithm performed best in prediction, achieving an average accuracy of 0.91 on the external test set with a 95% CI of 0.87-0.97.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The NLP-driven SVM algorithm demonstrates effective classification performance in automatically categorizing patient complaint texts. It showed superior performance in both internal and external test sets for communication and management problems. However, caution is advised when using it for classifying sense of responsibility complaints. This approach holds promises for implementation in medical institutions with high complaint volumes and limited resources for addressing patient feedback.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>complaint analysis</kwd>
        <kwd>text classification</kwd>
        <kwd>natural language processing</kwd>
        <kwd>NLP</kwd>
        <kwd>machine learning</kwd>
        <kwd>ML</kwd>
        <kwd>patient complaints</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Patient complaints refer to patients feeling dissatisfied or having opinions regarding medical services, treatment processes, medical staff attitudes, or health care institution management during their participation in medical care [<xref ref-type="bibr" rid="ref1">1</xref>]. These complaints are expressed through written or verbal feedback or grievances to relevant organizations or individuals. Complaints can involve various aspects, including medical errors, poor treatment outcomes, unfriendly service attitudes, and excessive waiting times among other issues.</p>
        <p>Handling patient complaints is an essential part of health care institution management, as it can help improve the quality of medical services and enhance patient satisfaction. Patient complaints also serve as valuable sources for gaining insights into safety-related issues within health care institutions. Patients are often more sensitive to a range of issues within medical services compared with health care professionals within the institution. Some of these issues may not be identified by traditional medical surveillance systems [<xref ref-type="bibr" rid="ref2">2</xref>], such as adverse event reporting systems or mortality case reviews. Therefore, patient complaints can provide crucial information for health care institutions on how to improve patient safety.</p>
        <p>Currently, patient satisfaction surveys are conducted through SMS text messages or online methods (such as through a WeChat [Tencent] official account) in our hospital. If a patient responds negatively, a staff member from the outpatient office follows up with a phone call. Under traditional management methods, satisfaction survey personnel meticulously document specific complaints from patients regarding dissatisfaction with the hospital’s medical management. These complaints are then summarized and regularly sent to the hospital’s Patient Advocacy Center (PAC). They are manually categorized and reported every 2 weeks during hospital meetings and also distributed to the email addresses of relevant clinical and medical technology department heads for corrective action and improvement. Only if the patient receives feedback from the relevant department, it will be considered as closing the loop on the complaint-handling process.</p>
        <p>On average, about 25 new complaints are submitted through various channels each day, while the PAC can only analyze and process approximately 10 complaints loops per day. At this rate, it can be estimated that the hospital’s PAC will still have over 5400 patient complaints waiting to be analyzed and addressed within a year. Clearly, without significant changes to the screening and categorization process, the hospital’s PAC will be unable to analyze all submitted complaints within a reasonable timeframe to provide adequate feedback and resolution. The crux of the issue lies in the inability to classify patient complaints in a timely manner, which consequently hampers targeted communication between subsequent departments and patients. This delay leads to patients lodging secondary or even multiple complaints due to prolonged waiting times. In addition, departments with the capability to address specific issues remain idle as they do not receive timely patient complaints. Experience with several hundred such interventions at community and academic medical centers shows fewer subsequent complaints associated with most of those receiving timely and effective feedback [<xref ref-type="bibr" rid="ref3">3</xref>]. Therefore, tardily and ineffectively addressing patient complaints has become a significant bottleneck restricting the enhancement of hospital management quality and medical safety.</p>
        <p>Automatic classification tools play a crucial role in streamlining the triage process, enabling health care providers to efficiently prioritize and address patient concerns based on the severity and nature of their complaints. By automating this classification process, clinicians can allocate resources more effectively, leading to improved patient outcomes and satisfaction. In addition, such tools facilitate the organization and analysis of large volumes of patient data, ultimately contributing to evidence-based decision-making and enhanced health care delivery. The problem is that there are hardly any studies, articles, or systems focusing on the automatic classification of patient complaints. The need for automatic classification of patient complaints is crucial, as manual identification of complaints is inefficient, time-consuming, and highly prone to errors.</p>
        <p>The main contributions of this study are by automating the patient complaint triage process, PAC can allocate resources more efficiently, thereby improving patient care experience and satisfaction. In addition, such tools help organize and analyze large amounts of patient complaint data, ultimately contributing to evidence-based medical decisions and improved medical services to ensure patient treatment safety.</p>
        <p>The structure of the article is as follows. “Existing Approaches to Text Classification” introduces previous studies on existing approaches to text classification and the patients complain auto-classification methodology. “Methods” and “Results” introduce machine learning (ML) models and experimental results. “Discussion” presents an analysis and discussion of selected results and offers some suggestions for future research. Finally, “Conclusion” summarizes our research.</p>
      </sec>
      <sec>
        <title>Existing Approaches to Text Classification</title>
        <p>The classification of patient complaint texts falls within the realm of text auto-classification. Therefore, many previous studies in text classification provide valuable insights for us (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. Especially, auto-classification of texts based on patients’ chief complaints (CC) during the diagnostic process is the most relevant to our research on auto-classifying patient complaint texts.</p>
        <p>CC text classification refers to the task of automatically categorizing or classifying text data based on the main concerns or symptoms expressed by patients when they seek medical attention [<xref ref-type="bibr" rid="ref10">10</xref>]. In principle, each patient complaint should be classified into 1 category, but typically 1 patient complaint may be classified into a single or multiple categories because it contains more than 1 category of disease. A recorded free-text CC is assigned to a category either manually by emergency medicine physicians or other emergency department (ED) professionals, or by using an automated mapping algorithm [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. Automated CC categorization, on the other hand, are more suitable for a wide range of (ED) applications. Traditional automated CC classification algorithms typically use a linear mapping algorithm (keyword search and category matching algorithm [<xref ref-type="bibr" rid="ref15">15</xref>]), or a semantic model based on Bayesian network [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>The study by Arnaud et al [<xref ref-type="bibr" rid="ref16">16</xref>] leveraged natural language processing (NLP) solutions to predict medical specialties at hospital admission by integrating structured data with unstructured textual notes. An MLP model and a convolutional neural network (CNN) were independently used to achieve promising accuracy in the analysis of over 260,000 ED records. Although the classifier model could only achieve about 68% accuracy of prediction, this research contributes to the growing use of NLP methods in health care analytics. NLP models achieved high accuracy in predicting the need for admission, triage score, critical illness, and mapping free-text CC to structured fields. Incorporating both structured data and free-text data improved results when compared with models that used only structured data. However, the majority of studies (16/20, 80%) were assessed to have a high risk of bias, and only 1 study reported the deployment of an NLP model into clinical practice [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>These traditional linear classification methods are all based on the bag-of-words (BOW) representation, which treats text as an unordered collection of words, ignoring the position and grammatical structure of words, and only focusing on the frequency of word occurrences. In the BOW model, text is represented as a vector, where each dimension corresponds to a word, and each element of the vector represents the frequency or occurrence of the corresponding word in the text. However, it is known that BOW technique suffers from issues such as loss of word order information, curse of dimensionality, sparsity, and semantic loss. These limitations restrict the performance of the BOW model in NLP tasks [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Therefore, researchers have proposed various improvement methods to overcome these issues, such as using word embedding techniques and models that consider contextual information [<xref ref-type="bibr" rid="ref20">20</xref>]. A representative work was proposed by Alhazzani et al [<xref ref-type="bibr" rid="ref21">21</xref>], who used pretrained static word embeddings and pretrained vector word embeddings to train deep learning (DL)–based BiLSTM (Bidirectional Long Short-Term Memory) and BiGRU (Bidirectional Gated Recurrent Unit) classifiers. Lee et al [<xref ref-type="bibr" rid="ref13">13</xref>] developed a recurrent neural network (RNN)–based long short-term memory (LSTM) and gated recurrent unit (GRU) cells for text classification [<xref ref-type="bibr" rid="ref13">13</xref>], and they reported that in all instances, the RNN models outperformed the BOW classifiers suggesting DL models could substantially improve the automatic classification of unstructured text for syndromic surveillance.</p>
        <p>Currently, 1 significant innovation using the transformer architecture [<xref ref-type="bibr" rid="ref22">22</xref>] and using bidirectional encoding to effectively capture dependency relationships from both directions of context simultaneously, has significantly propelled technological advancements across various CC text classification tasks [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. The performance of those models (BERT [Bidirectional Encoder Representations from Transformers; Google], Bio_BERT, Clinical BERT, KP_BERT, CC_BERT) was compared with that of the term frequency–inverse document frequency (TF-IDF) [<xref ref-type="bibr" rid="ref25">25</xref>] model serving as the baseline. However, the results revealed that the TF-IDF model outperforms a robust BERT-based model on the test dataset and exhibits statistical comparability in terms of misspelling sets.</p>
        <p>Despite the application of DL methods, including CNNs, RNNs, and BERT, in text categorization—particularly in handling large-scale, high-dimensional data and significantly enhancing text classification performance for complex tasks [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]—traditional ML approaches continue to offer advantages in terms of computational resource requirements and the interpretability of results compared with DL, CNNs, and RNNs. Modern RNNs can have millions of free parameters and thus require huge datasets [<xref ref-type="bibr" rid="ref28">28</xref>]. Training models of this size require significant computing resources. In the task of patient complaints classifying, besides pursuing classification accuracy, the interpretability of ML models should be prioritized. This is because our goal was to identify the root causes of patient complaints through a correct interpretation of classification results, and the interpretability of models such as DL, CNNs, and RNNs is notably low. This significantly undermines the credibility of clinical interpretations of the aforementioned analysis results and their subsequent applicability. Therefore, 3 interpretable common ML classification models (Multifactor Logistic Regression [MLR], Multinomial Naive Bayes [MNB], and Support Vector Machines [SVMs]) are used in our research work.</p>
        <p>By training ML models on large datasets of labeled complaint data, these models can learn to accurately categorize complaints based on their content and context. This automated classification approach can significantly improve the efficiency and accuracy of complaint management systems, reducing reliance on subjective human intervention and enabling faster processing and resolution of patient complaints. In addition, it can help to identify patterns and trends in complaints so that PAC can proactively address common issues and improve overall patient satisfaction.</p>
        <p>In this study, we explore the automatic text classification of patient complaints using 2 types of TF-IDF techniques and trained an ML tool for automatic classification of patient complaint texts written in Chinese based on the existing mature English text automatic classification models.</p>
        <p>We posit that an automated classification architecture for the categorization of patient complaints can be created, which consists of 2 modules.</p>
        <p>First, the NLP module is based on the TF-IDF technique. The function of this module is to perform word frequency and extract features from the patient complaint texts. By using the TF-IDF technique (Word-level TF-IDF and Ngram-level TF-IDF), the importance of each word and semantics in the text can be calculated and keywords representing the core meaning of the complaint can be extracted. This helps the model to better understand and classify the complaint texts.</p>
        <p>Second, the ML module is to classify complaint texts. ML algorithms have been widely adopted for text classification [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. However, existing research in the literature has primarily focused on the English language. Therefore, patient comments written in Chinese are currently difficult to automatically analyze using traditional ML or statistical approaches. While several classification models based on Chinese text have emerged, their efficacy, algorithmic intricacy, and substantial hardware requirements have impeded the broad implementation of this approach in scholarly discourse [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. The challenge of dealing with Chinese text lies in its complex linguistic features, including character-based writing, tonal variations, and the absence of explicit word boundaries. In addition, Chinese exhibits rich contextual meanings and cultural nuances, which can pose difficulties for NLP tasks such as machine translation, sentiment analysis, and text summarization. By using translation tools (such as ChatGPT 3.5 [OpenAI] or other professional translation tools) to translate Chinese text into English, and then having English professionals review and correct the translated results, these reviewed English texts were used as input data for ML models for classification training. This approach can overcome the challenges of directly processing Chinese text and provides an effective way to use Chinese text data in the test classification process.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Acquisition and Preprocessing Flow</title>
        <p>A retrospective study of patient complaints was conducted at Hangzhou Red Cross Hospital and Hangzhou Cancer Hospital from 2015 to 2019. A comprehensive compilation of 1817 documented complaints were carefully collated. Complaints involving the same patient and the same incident were grouped into 1 independent complaint case. This study was approved by the ethics committee, which granted a waiver of review and exempted it from the informed consent requirement. The data from Hangzhou Red Cross Hospital were used for model training and internal validation, while the data from Hangzhou Cancer Hospital were used for external testing of the model with the best performance in the ML model. All data collection and analysis methods in this study strictly adhere to the “Guidelines for Developing and Reporting Machine Learning Predictive Models in Biomedical Research” [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
        <p>Due to the current difficulty of directly applying ML and classification training to Chinese text, coupled with the availability of mature software and tools for translating Chinese into English, along with the review of translation results by English-proficient graduate students, converting the Chinese written text into English for training purposes is a feasible and efficient approach for automatic text classification. All the texts recorded in Chinese were translated into English by ChatGPT 3.5. Furthermore, 2 postgraduates with English language skills were responsible for reviewing the machine-translated texts; if there were obvious translation errors, the texts were corrected after the 2 individuals proposed unanimous modification suggestions.</p>
        <p>If 2 individuals had a disagreement regarding the translation of the same Chinese word, we would escalate the matter to native English-speaking professors in the International Education Department of the hospital. They would make the final decision to ensure that each identical Chinese word in all Chinese complaint texts was translated into English with complete consistency. To ensure the efficiency of the expert correction mechanism, we have established a reward system. For every flaw or error found in the machine-translated text, a certain amount of funds would be allocated from our project budget for rewards.</p>
        <p>Once sufficient data have been collected, preprocessing is divided into the 3 steps.</p>
        <p>In the first step, the complaint texts are tokenized. After comparing jieba (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendices 2</xref> and <xref ref-type="supplementary-material" rid="app3">3</xref>), THULAC [<xref ref-type="bibr" rid="ref37">37</xref>], and HanLP [<xref ref-type="bibr" rid="ref38">38</xref>], the more mature tool jieba is used in this study. To achieve the best balance between speed and accuracy in tokenization, the Hidden Markov Model Bigram (HMM-Bigram) [<xref ref-type="bibr" rid="ref39">39</xref>] algorithm is used. Part-of-speech tagging is performed at the same time as tokenization. This involves assigning labels to words based on their respective parts of speech, such as adjectives, verbs, nouns, and so on. Part-of-speech tagging is based on maximum entropy and maximum likelihood approaches.</p>
        <p>The second step is to eliminate duplicate parts in the tokenized results and ensure that each word appears only once. In this way, a total vocabulary is generated.</p>
        <p>In the third step, all complaint texts are searched. If a word from the total vocabulary occurs in a particular complaint text, the corresponding position is marked with 1. If it does not appear, it is marked with 0. This creates a matrix with words and tokens as horizontal and vertical axes. Each complaint text can be regarded as a vector of 1s and 0s.</p>
      </sec>
      <sec>
        <title>Feature Extraction</title>
        <p>After preprocessing, feature extraction was adopted before model training. The features are presented in text form, whereby words and phrases with a strong semantic meaning are included as a feature set. The feature set contains most of the information from the entire text, which is beneficial for document classification. Content that is not included in the feature set may result in the loss of some semantic information but has minimal impact on the classification task. Complaint texts usually have a length of 10-100 words and are therefore relatively short. To achieve a relatively accurate classification, the TF-IDF technique was used for the extraction of text features.</p>
        <p>After the preprocessing step, there are still many semantically meaningless particles or signs in the text. For example, “doctor” appears frequently in the text, but its contribution to text classification is relatively small. In addition to the common 841 Chinese stop words, we included an additional 17 frequently occurring but semantically insignificant words from the medical complaint domain into our stop words list based on unanimous recommendations from the staff of our collaborating hospital’s PAC. This decision was made based on our previous experience, as detailed in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. By including them as stop words, we can focus on more specific and meaningful keywords and thus improve the accuracy and relevance of extracting high-frequency words.</p>
      </sec>
      <sec>
        <title>Semantic Analysis</title>
        <p>Due to the singularity of the environment in which patients complain, the content of the text has a high similarity in terms of scenes and semantics. Therefore, in addition to using Word-level TF-IDF, we also used Ngram-level TF-IDF to examine the impact of consecutive words on the importance of text. Given our dataset’s modest size of approximately 2600 cases and the need for higher granularity in data analysis, the decision was made to use n=2 for Ngram-level TF-IDF.</p>
        <p>After TF-IDF analysis and extension of existing stop words, the problem of particles such as “doctor” can be alleviated, and the feature text is more suitable for the following ML text classification training. For example, the complaint text “Doctor issued unnecessary examination orders for financial reasons” was changed to “unnecessary examination orders financial reasons.” The top 10 high-probability words and word clouds for each type of complaint are calculated and displayed. This step not only allows for an understanding of the basic structure of existing complaint text data but also enables the examination of the correctness of manually labeled complaint texts, preparing necessary groundwork for subsequent model training and verification.</p>
      </sec>
      <sec>
        <title>Unbalanced Data Handling</title>
        <p>The degree of imbalance of dataset is based on the proportion of a minority class in the whole dataset and could range from mild (20%-40%), moderate (1%-20%) to vigorous (&#60;1%) imbalances [<xref ref-type="bibr" rid="ref40">40</xref>]. Previous studies showed that the resampling approach is a useful preprocessing step to handle the imbalanced dataset [<xref ref-type="bibr" rid="ref41">41</xref>]. This method modifies the imbalanced distribution of the majority and minority classes at the data level before training with classifiers. Before training the datasets, we used the Synthetic Minority Oversampling Technique (SMOTE) as an imbalanced adjustment strategy [<xref ref-type="bibr" rid="ref42">42</xref>]. The decision was made due to a moderate dataset imbalance (sense of responsibility/communication problem=11.9%). The datasets of the minority class, including diagnosis and treatment, management problem, and sense of responsibility, were all up sampled to 719. Unlike regular SMOTE, we matched the data volume of minority classes to the majority class through up sampling, while keeping the actual amount of data in the majority class unchanged. This maneuvering minimized the impact on the raw data distribution. One important point to emphasize is that SMOTE only oversamples the internal data used for training and validation, while the independent external data used for testing remains untouched.</p>
      </sec>
      <sec>
        <title>Classification Model Training and Validation</title>
        <p>In order to ensure the consistency of the labeling by the 2 experts, the complaint data were independently labeled by the 2 experts. Secondary annotations for the data of different categories were made by PAC staff from our cooperative hospital, comprising 3 people in total. Finally, the classification results were counted from 5 people for this annotation, and the category that received the most votes was determined as the final complaint classification annotation. We implemented a comparison of several well-known ML classifiers to determine if a supervised ML algorithm can achieve a reasonable classification accuracy compared to the expert rules. The complaint types are “communication problem,” “diagnosis and treatment,” “management problem,” and “sense of responsibility.” The sample counts for each type are shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <p>In total, 3 ML methods (MLR, MNB, and SVMs) were used to train and validate the model. In the training process, 75% (539/719) of the data in each category were used for training, the rest of 25% (180/719) was used for verification. Another 376 patient complaint records from Hangzhou Cancer Hospital were used for external testing of the trained model with the best performance in the training and verification section. The composition of the 376 patient complaint records is communication problem (n=122), diagnosis and treatment (n=89), management problem (n=85), and sense of responsibility (n=80). The performance of ML algorithms in the training and verification sets is shown in <xref ref-type="table" rid="table2">Table 2</xref>. To assess the generalization ability of the trained model in a more objective manner, a 5-fold cross-validation (CV) was applied to evaluate the model performance during external testing. <xref rid="figure1" ref-type="fig">Figure 1</xref> summarizes the entire process of preprocessing and ML method for patient complaint classification.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Sample number of complaints for each type in the training and verification sets.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="350"/>
            <col width="320"/>
            <col width="330"/>
            <thead>
              <tr valign="bottom">
                <td>Category</td>
                <td>Sample size of raw data</td>
                <td>Sample size after SMOTE<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Communication problem</td>
                <td>719</td>
                <td>719</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis and treatment</td>
                <td>376</td>
                <td>719</td>
              </tr>
              <tr valign="top">
                <td>Management problem</td>
                <td>260</td>
                <td>719</td>
              </tr>
              <tr valign="top">
                <td>Sense of responsibility</td>
                <td>86</td>
                <td>719</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>1441</td>
                <td>2876</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>SMOTE: Synthetic Minority Oversampling Technique.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Comparison of the performance of 3 machine learning algorithms.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="120"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Machine learning models</td>
                <td colspan="4">Communication problem</td>
                <td colspan="4">Diagnosis and treatment</td>
                <td colspan="5">Management problem</td>
                <td colspan="3">Sense of responsibility</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">Training</td>
                <td colspan="2">Validation</td>
                <td colspan="2">Training</td>
                <td colspan="2">Validation</td>
                <td colspan="2">Training</td>
                <td colspan="2">Validation</td>
                <td colspan="3">Training</td>
                <td>Validation</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="19">
                  <bold>MLR<sup>a</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Precision</td>
                <td colspan="2">0.83</td>
                <td colspan="2">0.71</td>
                <td colspan="2">0.89</td>
                <td colspan="2">0.83</td>
                <td colspan="2">0.99</td>
                <td colspan="2">0.97</td>
                <td colspan="3">1.00</td>
                <td colspan="2">0.99</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Recall</td>
                <td colspan="2">0.95</td>
                <td colspan="2">0.91</td>
                <td colspan="2">0.88</td>
                <td colspan="2">0.81</td>
                <td colspan="2">0.94</td>
                <td colspan="2">0.88</td>
                <td colspan="3">0.96</td>
                <td colspan="2">0.89</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td colspan="2">0.89</td>
                <td colspan="2">0.80</td>
                <td colspan="2">0.88</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.96</td>
                <td colspan="2">0.92</td>
                <td colspan="3">0.98</td>
                <td colspan="2">0.94</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Support</td>
                <td colspan="2">160</td>
                <td colspan="2">140</td>
                <td colspan="2">195</td>
                <td colspan="2">183</td>
                <td colspan="2">209</td>
                <td colspan="2">197</td>
                <td colspan="3">210</td>
                <td colspan="2">200</td>
              </tr>
              <tr valign="top">
                <td colspan="19">
                  <bold>SVM<sup>b</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Precision</td>
                <td colspan="2">0.75</td>
                <td colspan="2">0.67</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.95</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.99</td>
                <td colspan="3">1.00</td>
                <td colspan="2">1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Recall</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.96</td>
                <td colspan="2">0.81</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.92</td>
                <td colspan="3">0.96</td>
                <td colspan="2">0.92</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td colspan="2">0.86</td>
                <td colspan="2">0.80</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.87</td>
                <td colspan="2">0.99</td>
                <td colspan="2">0.95</td>
                <td colspan="3">0.98</td>
                <td colspan="2">0.96</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Support</td>
                <td colspan="2">167</td>
                <td colspan="2">122</td>
                <td colspan="2">219</td>
                <td colspan="2">210</td>
                <td colspan="2">220</td>
                <td colspan="2">193</td>
                <td colspan="3">209</td>
                <td colspan="2">195</td>
              </tr>
              <tr valign="top">
                <td colspan="19">
                  <bold>MNB<sup>c</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Precision</td>
                <td colspan="2">0.73</td>
                <td colspan="2">0.67</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.95</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.99</td>
                <td colspan="3">1.00</td>
                <td colspan="2">1.00</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Recall</td>
                <td colspan="2">1.00</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.94</td>
                <td colspan="2">0.81</td>
                <td colspan="2">0.96</td>
                <td colspan="2">0.92</td>
                <td colspan="3">0.97</td>
                <td colspan="2">0.92</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td><italic>F</italic><sub>1</sub>-score</td>
                <td colspan="2">0.84</td>
                <td colspan="2">0.80</td>
                <td colspan="2">0.96</td>
                <td colspan="2">0.87</td>
                <td colspan="2">0.98</td>
                <td colspan="2">0.95</td>
                <td colspan="3">0.98</td>
                <td colspan="2">0.96</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Support</td>
                <td colspan="2">134</td>
                <td colspan="2">122</td>
                <td colspan="2">219</td>
                <td colspan="2">210</td>
                <td colspan="2">220</td>
                <td colspan="2">193</td>
                <td colspan="3">219</td>
                <td colspan="2">195</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>MLR: Multifactor Logistic Regression.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>SVM: Support Vector Machine.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>MNB: Multinomial Naive Bayes.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Illustration of the text preprocessing workflow and patient complaint classification model development and validation process. HMM-Bigram: Hidden Markov Model Bigram; MLR: Multifactor Logistic Regression; MNB: Multinomial Naive Bayes; SMOTE: Synthetic Minority Oversampling Technique; SVM: Support Vector Machine; TF-IDF: term frequency–inverse document frequency.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>From an ethical standpoint, the present study focused on the examination of public behavior in human subjects. The information collection methods used by the researchers were designed to ensure that subjects could not be directly identified, nor could they be indirectly identified through associated identifiers. To facilitate the effective handling of patient complaints, informed consent was obtained for telephone recordings or written complaints, with access to this information restricted to designated hospital departments. In the context of this research, only the specific content of patient complaints was analyzed, without any extraction or linkage to personal identifiable information. Furthermore, the identities of hospital staff members who were the subjects of complaints were anonymized, with only their departmental affiliation being retained. This approach served to mitigate potential conflicts between complainants and the staff involved. In addition, the potential for harm or discomfort anticipated in the study did not surpass that which individuals might have experienced in daily life or during standard physical and psychological examinations. Consequently, the hospital’s ethics review committee granted a waiver of review for this research.</p>
        <p>The study was carried out in compliance with the Declaration of Helsinki and received ethical approval as a waiver of review from the Ethics Committee of Hangzhou Red Cross Hospital.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>In our investigation, we discovered that out of 1817 patient complaints, approximately 23 cases, accounting for 1.3% of the total, required modification post translation by ChatGPT 3.5 to avoid potential ambiguity. Among these cases, communication problem accounted for 7 instances, diagnosis and treatment only had 1, management problem had 4, while sense of responsibility constituted 11 cases. Most ambiguities were concentrated within communication problem and sense of responsibility categories, with relatively fewer occurrences in the more objective diagnosis and treatment and Management Problem categories. This observation may be attributed to the inherent difficulty patients encounter in articulating issues related to communication problem and sense of responsibility, compared with the relatively straightforward nature of diagnosis and treatment and management problem categories.</p>
        <p>The HMM-Bigram algorithm was used for part-of-speech tagging. For the input text: “General surgery patients complained that unnecessary examination items were applied by the doctor,” the tagging results are as follows: [(‘General’, ‘JJ-TL’), (‘surgery’, ‘NN’), (‘patients’, ‘NNS’), (‘complained’, ‘VBD’), (‘that’, ‘DT’), (‘doctor’, ‘NN’), (‘applied’, ‘VBN’), (‘unnecessary’, ‘JJ’), (‘examination’, ‘NN’), (‘items’, ‘NNS’), (‘performance’, ‘NN’), (‘commissions’, ‘NNS’)]. Each tag consists of 2 parts, the first being the word itself, and the second being the part-of-speech tag for that word. For example, in the first tag of the results (‘General’, ‘JJ-TL’), “General” is the word, and “JJ-TL” is its part-of-speech tag. In this tag, “JJ” indicates an adjective, while “TL” represents the word’s tag in the Brown Corpus. Similarly, (‘surgery’, ‘NN’) indicates that “surgery” is a noun.</p>
        <p>The following image (<xref rid="figure2" ref-type="fig">Figure 2</xref>) illustrates a matrix with words and tokens as horizontal and vertical axes with the HMM-Bigram algorithm.</p>
        <p>In the methodology section, 2 methods, Word-level TF-IDF and Ngram-level TF-IDF (with n=2), were used for feature extraction from the text. The TF-IDF values and their performance on the training and verification sets are shown in <xref rid="figure3" ref-type="fig">Figure 3</xref> and <xref ref-type="table" rid="table3">Table 3</xref>, respectively.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Illustration of a matrix with words and tokens as horizontal and vertical axes with the Hidden Markov Model Bigram token algorithm.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Comparison of the term frequency–inverse document frequency values between Word-level and Ngram-level term frequency–inverse document frequency (with n=2). TF-IDF: term frequency–inverse document frequency.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Classification results comparison of Word-level term frequency–inverse document frequency and Ngram-level term frequency–inverse document frequency (n=2).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="290"/>
            <col width="90"/>
            <col width="90"/>
            <col width="0"/>
            <col width="90"/>
            <col width="90"/>
            <col width="0"/>
            <col width="90"/>
            <col width="90"/>
            <col width="0"/>
            <col width="90"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Precision</td>
                <td colspan="3">Recall</td>
                <td colspan="3"><italic>F</italic><sub>1</sub>-score</td>
                <td colspan="2">Support</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>WL<sup>a</sup></td>
                <td>NL<sup>b</sup></td>
                <td colspan="2">WL</td>
                <td>NL</td>
                <td colspan="2">WL</td>
                <td>NL</td>
                <td colspan="2">WL</td>
                <td>NL</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Communication problem</td>
                <td>0.73</td>
                <td>0.74</td>
                <td colspan="2">0.95</td>
                <td>0.95</td>
                <td colspan="2">0.82</td>
                <td>0.83</td>
                <td colspan="2">138</td>
                <td>140</td>
              </tr>
              <tr valign="top">
                <td>Management problem</td>
                <td>0.93</td>
                <td>0.93</td>
                <td colspan="2">0.89</td>
                <td>0.88</td>
                <td colspan="2">0.91</td>
                <td>0.91</td>
                <td colspan="2">189</td>
                <td>189</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis and treatment</td>
                <td>0.99</td>
                <td>0.99</td>
                <td colspan="2">0.89</td>
                <td>0.9</td>
                <td colspan="2">0.94</td>
                <td>0.94</td>
                <td colspan="2">201</td>
                <td>200</td>
              </tr>
              <tr valign="top">
                <td>Sense of responsibility</td>
                <td>1</td>
                <td>1</td>
                <td colspan="2">0.94</td>
                <td>0.94</td>
                <td colspan="2">0.97</td>
                <td>0.97</td>
                <td colspan="2">192</td>
                <td>191</td>
              </tr>
              <tr valign="top">
                <td>Accuracy</td>
                <td>—<sup>c</sup></td>
                <td>—</td>
                <td colspan="2">—</td>
                <td>—</td>
                <td colspan="2">0.91</td>
                <td>0.92</td>
                <td colspan="2">720</td>
                <td>720</td>
              </tr>
              <tr valign="top">
                <td>Macro average</td>
                <td>0.91</td>
                <td>0.92</td>
                <td colspan="2">0.92</td>
                <td>0.92</td>
                <td colspan="2">0.91</td>
                <td>0.91</td>
                <td colspan="2">720</td>
                <td>720</td>
              </tr>
              <tr valign="top">
                <td>Weighted average</td>
                <td>0.93</td>
                <td>0.93</td>
                <td colspan="2">0.91</td>
                <td>0.92</td>
                <td colspan="2">0.92</td>
                <td>0.92</td>
                <td colspan="2">720</td>
                <td>720</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Word-level term frequency–inverse document frequency.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Ngram-level term frequency–inverse document frequency.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>Not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Semantic Analysis</title>
        <p>A total of 4 complaint categories underwent preprocessing after incorporating expended stop words to enhance the specificity of medical complaints. This process generated high-frequency word histograms, and the word frequency analysis results for the 4 types of complaints will be uploaded as supplementary files (Multimedia Appendices). The top 3 vocabulary words in the category of “communication problem” are “explanation,” “enough,” and “believes.” In the category of “diagnosis and treatment” complaints, apart from “diagnosis and treatment” itself, the main concerns were “effect,” “pediatric,” and “emergency.” In the category of “management problem” complaints, the primary content revolves around “clinic,” “waiting,” and “time.” As for the category of “sense of responsibility,” the prominent content includes “medicine,” “back,” and “went.”</p>
      </sec>
      <sec>
        <title>Performance of Patient Complaint Classification Models</title>
        <p>The performance of 3 ML models in the training and validation sets was demonstrated in <xref ref-type="table" rid="table2">Table 2</xref> (for more detailed data including the 95% CIs for each metric, please refer to <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). It was found that MLR achieved the best performance in classifying the communication problem, as assessed by <italic>F</italic><sub>1</sub>-score. However, in the classification tasks of the remaining 3 categories, SVM outperformed MLR and MNB, comprehensively. Furthermore, from the training and validation iteration process, it can be observed that the model began to converge well by the eighth epoch (<xref rid="figure4" ref-type="fig">Figures 4</xref> and <xref rid="figure5" ref-type="fig">5</xref>). In addition, the best model achieved very high receiver operating characteristic (ROC) values (ROC&#62;0.97) in classifying the 4 types on the test set. Hence, the SVM algorithm was adopted for the subsequent external data validation section with a 5-fold CV method applied. A more detailed comparison of the point estimate and 95% CIs for each model’s performance metrics has been included in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Demonstration of training and validation performance in machine learning iteration process. Training and validation performance of Support Vector Machine. acc: accuracy.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Training and validation performance of Support Vector Machine (receiver operating characteristic curve). ROC: receiver operating characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Stability of Model Iteration Process</title>
        <p>To monitor the stability of the model’s training effects during the machine-learning process, we set a maximum iteration number of 30. It was found that all ML algorithms perfectly converged in the first 20 iterations, and the MLR had the most stable output and the best generalization performance during the training and validation iterations (<xref rid="figure6" ref-type="fig">Figures 6</xref>-<xref rid="figure8" ref-type="fig">8</xref>). However, due to the use of the SGD (Stochastic Gradient Descent) algorithm, the SVM algorithm tended to output significantly fluctuating results during the training process (<xref rid="figure4" ref-type="fig">Figures 4</xref> and <xref rid="figure5" ref-type="fig">5</xref>). Although the MNB algorithm performed well on the training set, it exhibited overfitting and mediocre generalization ability on the test set (<xref rid="figure9" ref-type="fig">Figures 9</xref> and <xref rid="figure10" ref-type="fig">10</xref>).</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Demonstration of training and validation performance in machine learning iteration process. Confusion matrix of Multinomial Naive Bayes, Logistic Regression, and Support Vector Machine in testing set. svm: Support Vector Machine.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Demonstration of training and validation performance in machine learning iteration process. Training and validation performance of Multinomial Naive Bayes. acc: accuracy.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Training and validation performance of Multinomial Naive Bayes (receiver operating characteristic curve). ROC: receiver operating
characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure9" position="float">
          <label>Figure 9</label>
          <caption>
            <p>Demonstration of training and validation performance in machine learning iteration process. Training and validation performance of Multifactor Logistic Regression. acc: accuracy.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure10" position="float">
          <label>Figure 10</label>
          <caption>
            <p>Training and validation performance of Multifactor Logistic Regression (receiver operating characteristic curve). ROC: receiver operating
characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Performance of the 5-Fold SVMs Algorithm on the External Test Dataset</title>
        <p>It was inspiring to see that the SVM classification algorithm achieved a commendable result in accurately categorizing 3 distinct types of patient complaints (communication problem, diagnosis, treatment, and management problem) on the external test dataset. The average area under the curve (AUC) for these 3 types was 0.94, 0.86, and 0.81, respectively, with an average SD below 0.1 in all 3 types of patient complaints (<xref rid="figure11" ref-type="fig">Figures 11</xref>-<xref rid="figure13" ref-type="fig">13</xref>). However, the average AUC for the sense of responsibility category was only 0.7 (in the 5-fold testing, the minimum AUC is 0.48, and the maximum AUC is only 0.82; <xref rid="figure14" ref-type="fig">Figure 14</xref>).</p>
        <fig id="figure11" position="float">
          <label>Figure 11</label>
          <caption>
            <p>A 5-fold cross-validation curve of receiver operating characteristic of Support Vector Machine on the external test data set. Receiver
operating characteristic for communication problem classification. AUC: area under the curve; ROC: receiver operating characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure12" position="float">
          <label>Figure 12</label>
          <caption>
            <p>A 5-fold cross-validation curve of receiver operating characteristic of Support Vector Machine on the external test data set. Receiver
operating characteristic for diagnosis and treatment problem classification. AUC: area under the curve; ROC: receiver operating characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig12.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure13" position="float">
          <label>Figure 13</label>
          <caption>
            <p>A 5-fold cross-validation curve of receiver operating characteristic of Support Vector Machine on the external test data set. Receiver
operating characteristic for management problem classification. AUC: area under the curve; ROC: receiver operating characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig13.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure14" position="float">
          <label>Figure 14</label>
          <caption>
            <p>A 5-fold cross-validation curve of receiver operating characteristic of Support Vector Machine on the external test data set. Receiver
operating characteristic for sense of responsibility problem classification. AUC: area under the curve; ROC: receiver operating characteristic.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e55721_fig14.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Ambiguities arise more frequently in areas where patients may struggle to clearly articulate their concerns, particularly in subjective categories like communication and responsibility. Word-level TF-IDF proved sufficient for our needs. The result also revealed that Ngram-level methods did not significantly enhance model performance, even after optimal tuning of N. The NLP-driven SVM algorithm effectively classifies patient complaint texts, demonstrating superior performance in both internal and external test sets for communication and management problems.</p>
      </sec>
      <sec>
        <title>Related Systems for Patient Complaints Text Classification</title>
        <p>Traditional text classification relies on hand-coded keyword-based methods suffer from low efficiency and accuracy. The manual creation of these classifiers (often in the form of expert rules) is a difficult and expensive process [<xref ref-type="bibr" rid="ref43">43</xref>] that requires the coordinated work of medical experts and knowledge engineers. To the best of our knowledge, there are currently 3 manual approaches to classifying patient complaint texts: The first one is Patient Advocacy Reporting System (PARS), the second mainly focused on Healthcare Complaint Analysis Tool (HCAT [<xref ref-type="bibr" rid="ref44">44</xref>]), developed by UK researchers Alex Gillespie and Tom Reader, and the last one is based on the use of the qualitative analysis software NVivo [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>], launched by the Australian company QSR (now Lumivero). However, both HCAT and NVivo require human classification at various stages of the classification process. Therefore, these methods are at best semiautomatic means for text classification. They have not yet fully solved the problem of manual intervention in the classification process [<xref ref-type="bibr" rid="ref47">47</xref>].</p>
      </sec>
      <sec>
        <title>Ngram-Level TF-IDF Failed to Enhance Classification Performance</title>
        <p>As gleaned from <xref ref-type="table" rid="table3">Table 3</xref>, the increment in precision, recall, and <italic>F</italic><sub>1</sub>-score with Ngram-level TF-IDF (n=2) merely amounted to 1%, rising from 0.91 to 0.92. The reason analysis for why Ngram-level TF-IDF (n=2) did not improve the classification performance of Word-level TF-IDF could be as described further. First, the primary reason might be Ngram-level TF-IDF with n=2 considers pairs of words, capturing some contextual information. However, this may not always lead to significant improvements, especially when text prone to ambiguity undergoes review by language experts, the additional information obtainable from conjunctions becomes relatively limited. The second possible reason was Ngram-level TF-IDF, particularly with smaller datasets (only 2157 cases for training), which could be prone to overfitting. It might capture too much noise or specific patterns from the training data that did not generalize well to unseen data, resulting in worse performance on the test set. For tuning the parameter of Ngram-level TF-IDF, we used the MNB method and set N to values ranging from 1 to 5. The results were depicted in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>. It can be observed that when N=1, the model achieved its maximum values for precision, recall, and <italic>F</italic><sub>1</sub>-score. Consequently, N=1 for Ngram-level TF-IDF corresponds to using Word-level TF-IDF.</p>
      </sec>
      <sec>
        <title>The Feasibility of Using ChatGPT as a Bulk Translation Tool</title>
        <p>The process of translating patient complaints into English through ChatGPT could potentially introduce several issues into the classification, especially concerning the accuracy of translation. Common knowledge holds by European and American litterateurs that translating ancient Chinese poetry into English is extremely challenging. However, in a study reported by Gao et al [<xref ref-type="bibr" rid="ref48">48</xref>], they compared the performances of ChatGPT with Google Translate and DeepL Translator in translating Chinese classical poetry in terms of fidelity, fluency, language style, and machine translation style. The results revealed that ChatGPT outperformed Google Translate and DeepL Translator in all evaluation criteria. Therefore, in our research, the difficulty level of the Chinese text of patient complaints was significantly lower compared with classical poetry. The texts were generally very clear and complete, containing specific elements and structures such as precise time, location, individuals involved, and events. As the complainants were patients and their family members, the language was relatively common, devoid of esoteric medical terminology. Consequently, for ChatGPT 3.5, the translation results were very close to the outcomes of human translations. In addition, 2 postgraduates with English language skills were responsible for reviewing the machine-translated texts. If there were obvious translation errors, the texts were corrected after the 2 individuals proposed unanimous modification suggestions. Therefore, we believe that at least using ChatGPT 3.5 for translating bulk of simple complaint texts into English was acceptable and efficient, as we did not have to struggle with balancing the accuracy and efficiency of the translation.</p>
      </sec>
      <sec>
        <title>Appropriate Number and Types of Categories</title>
        <p>Reader et al [<xref ref-type="bibr" rid="ref49">49</xref>] developed a coding taxonomy for analyzing patient complaints. The subcategories were thematically grouped into 7 categories and then 3 conceptually distinct domains. Their “3-domain” classification system is similar to our “4-category” one. For instance, “the safety and quality of clinical care” corresponds to our “diagnosis and treatment,” “management of health care organizations” corresponds to our “management problem,” and “healthcare staff-patient relationships” corresponds to our “communication problem” and “sense of responsibility.”</p>
        <p>We subdivided “healthcare staff-patient relationships” into 2 categories because it was considered that communication issues were skill-related problems that can be addressed through targeted training. At the same time, the sense of responsibility is a matter of the staff’s character that requires long-term education and may even necessitate stricter rewards and penalties to improve. They also reported that the most common issues complained about were “treatment” (113,738/88,069, 15.6%) and “communication” (12,065/88,069, 13.7%). However, our research shows that complaints mainly stem from “communication” (719/1465, 49.9%) and “diagnosis and treatment” (376/1465, 26.1%), respectively. However, when focusing on categorizing complaints, we must analyze the data sources, as there can be significant differences between patient complaint data from specialized hospitals and data from comprehensive hospitals. Even within the same hospital, there can be significant variations in complaint data between different departments.</p>
        <p>Another similar research carried out by HaCohen-Kerner et al [<xref ref-type="bibr" rid="ref50">50</xref>], showed that their study attempted to reduce the number of categories for automatic text classification from 7 to 4 across 2073 samples. The predictive model’s performance reached its peak accuracy (93.8%) on the test set when the number of categories was reduced to 4. Therefore, it was reasonable in our research to limit the predicted categories to 4 in similar sample sizes.</p>
      </sec>
      <sec>
        <title>Optimal Number of Folds to Use in a K-Fold Cross-Validation in External Dataset</title>
        <p>It is well-accepted that larger k means less bias toward overestimating the true expected error but higher variance and higher running time. In both of these cases, selecting k depends on the same thing. We must ensure that the training set and testing set are drawn from the same distribution and that both sets contain sufficient variation such that the underlining distribution is represented. The problem we encountered involved using training and verification data sourced from a general hospital and external test data from a specialized cancer hospital. Discrepancies in patient treatment expectations and compliance between the 2 hospitals may introduce biases in the distribution of complaint data. Consequently, we opted to use CV testing during external testing to mitigate the potential impact of these factors on data representation.</p>
        <p>Selecting k is not an exact science because it is challenging to find a balance in a fold of data that effectively represents the overall dataset while also minimizing data bias. We try to use a 5-fold cross validation, in this case, with approximately 75 (376×0.2) instances per fold, conducting 10-folds CV would result in only about 37 instances per fold. As a result, all 4 types of complaints may not be encompassed within a single fold. However, if our dataset size increases dramatically, like if we have over 10,000 instances, a 10-fold cross validation would lead in folds of 1000 instances. In a related work carried by Oyedele [<xref ref-type="bibr" rid="ref51">51</xref>], a bigger independent testing set of size 10,000 (independently sampled from the same distribution and using the same parameters with 5000 samples per class) was created in order to estimate the performance (ie, error probability) of the network. Therefore, for a task with 2 classifications and 10,000 samples, they adopt a 10-fold CV, which poses much less risk of bias in the results compared with our 5-fold CV approach.</p>
      </sec>
      <sec>
        <title>Advantages of Using TF-IDF and SVM for Patient Complaint Text Classification</title>
        <p>Elmessiry et al [<xref ref-type="bibr" rid="ref52">52</xref>] compared a text classification method using 6 ML classifiers and suggested that the TF-IDF–based random forest classification algorithm has advantages in text classification both in accuracy and <italic>F</italic><sub>1</sub>-score. However, based on their results, the achieved accuracy, <italic>F</italic><sub>1</sub>-score, sensitivity, and specificity in correctly classifying patient complaints were relatively low, with values of 82%, 81%, 0.76, and 0.87 respectively.</p>
        <p>Previous studies have used ML algorithms such as SVMs [<xref ref-type="bibr" rid="ref53">53</xref>], Logistic Regression [<xref ref-type="bibr" rid="ref54">54</xref>], and Naive Bayes classifiers [<xref ref-type="bibr" rid="ref55">55</xref>] for classification purposes [<xref ref-type="bibr" rid="ref56">56</xref>]. Compared with other ML algorithms, the SVM algorithm has demonstrated superior performance in text classification, which aligns closely with our research findings. The strong generalization capability of SVM in high-dimensional feature spaces can be credited for their effectiveness in text classification tasks. SVMs eliminate the need for feature selection, simplifying the classification process. Their regularization parameters help prevent overfitting, making them robust in handling noisy data and datasets with many features. In addition, SVMs are efficient in processing small to medium-sized datasets, producing reliable performance even with limited training data. Our research also confirmed that, even with very limited sample sizes, such as in the cases of “management problem” and “sense of responsibility” with raw data sizes of only 260 and 86, the SVM algorithm achieved average AUC scores of 0.81 and 0.7, respectively, in external test sets.</p>
        <p>In the text preprocessing and ML section, we used the pipeline training architecture, which can be seen as a tool to connect multiple data processing and model training steps. It allows users to combine multiple operations in a specific order to form a complete flow and ensures data flows between each operation. Through pipeline, data preprocessing, feature engineering, model training, model evaluation, and other steps can be organically combined into a complete ML process. The advantage of doing this is improving code maintainability and reusability, making it easier to perform the same workflow on different datasets and better managing dependencies between each step.</p>
        <p>We initialized SVM parameters as listed in <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref> and adopted a fine-tuning with genetic algorithm–SVM as proposed by Ali et al [<xref ref-type="bibr" rid="ref57">57</xref>] and Nair et al [<xref ref-type="bibr" rid="ref58">58</xref>], which has the best model performance while keeping a reasonable optimization time. The detailed tuning process and prediction results before and after tuning have been illustrated in <xref ref-type="supplementary-material" rid="app9">Multimedia Appendices 9</xref> and <xref ref-type="supplementary-material" rid="app10">10</xref>).</p>
      </sec>
      <sec>
        <title>ML Model Selection Strategy</title>
        <p>A critical consideration is the balance between model accuracy and model simplicity or interpretability. High accuracy is essential for a model’s effectiveness, especially in scenarios that rely on making correct predictions. While complex models (such as DL or ensemble methods) can achieve higher accuracy due to their ability to capture intricate patterns in the data, they often require large amounts of data and substantial computational resources. Models with high interpretability foster trust and accountability, as stakeholders can see and understand how decisions are made. However, there is a trade-off here; complex models may exhibit lower bias but higher variance, meaning they might fit the training data very well but perform poorly on unseen data due to overfitting. Conversely, simpler models tend to have higher bias, potentially missing significant patterns in the data, but they perform more consistently across different datasets.</p>
        <p>In this study, a hybrid strategy was adopted in ML model selection. In the first stage, 3 ML algorithms (MLR, MNB, and SVM) were used for model training and validation. In the second stage, the best-performing model was tested using 5-fold CV on external data. Ultimately, the choice of model should be guided by the specific context of the problem, including the importance of accuracy versus interpretability, the stakes involved, and the audience for the model outputs. In the specific task of patient complaint classification, we prioritize the generalization ability of the model, which means achieving the best prediction accuracy on unseen data. This preference is crucial because if the model’s generalization is insufficient, misclassified complaint cases will require more human effort to resolve, and the resulting delay in complaint resolution might exacerbate patient-doctor conflicts and disputes.</p>
      </sec>
      <sec>
        <title>Limitations and Further Research Directions</title>
        <p>In this study, the original data were initially in Microsoft Excel format, and each row of complaint content was separately saved as a text file before subsequent data cleaning and analysis were performed. Consequently, similar processing was required during application to ensure compatibility with the model. Failure to align the actual input data format with that of the model could lead to the inability of the model to predict outcomes correctly. Therefore, in subsequent work, a complaint text organization code will be developed to support both individual complaint text prediction through copy-and-paste operations and batch text processing.</p>
        <p>It is noteworthy that despite ultimately selecting the SVM algorithm for validating external data, it displayed consistent fluctuations in learning accuracy and verification loss throughout in training iteration. We attempted to improve the situation by reducing the learning rate from 0.5 to 0.1, but this did not yield positive results. After ruling out factors such as randomness and model complexity, we speculate that it is likely due to the SVM algorithm using SGD optimization, which can cause the model to converge to local minimum or exhibit more significant fluctuations in results. Another possibility may be the imbalance in our raw data distribution, with the third class, “management problem,” and the fourth class, “sense of responsibility,” having too few data samples.</p>
        <p>The primary challenge addressed in this study pertains to the imbalanced distribution of raw data and the limited dataset size. Although we used SMOTE to adjust for imbalanced data, the synthetic samples generated by SMOTE may introduce noise or distortions into the dataset, potentially leading to information loss and affecting the classifier’s performance on the minority class. To address this issue, our future work will involve collaborative efforts with multiple hospitals to enhance data volume. Furthermore, as is well-known, more advanced NLP models (eg, BERT) provide contextual understanding, enabling them to grasp complex relationships within text and improve analysis accuracy and depth. As a future direction for our work, we plan to develop a user-friendly graphical user software interface powered by BERT to facilitate the classification and management of complaints by PAC personnel.</p>
        <p>Another issue that must be stated is that the semantic features extracted using NLP technology are quite different from the common scenarios based on explicit independent and dependent variables. In ML problems with clear relationships between independent and dependent variables, it is possible to rank the importance of independent variables, as these features have stable meanings themselves. However, semantic features are influenced by the linguistic context, meaning that the same word can have different meanings in different language environments and contexts. Therefore, our results cannot pinpoint which specific words significantly influence the classification of complaint text types.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>The NLP combined SVM algorithm performs well in automatically categorizing patient complaint texts. Furthermore, it has the best performance in both internal and external test sets for communication and management problems. However, caution is necessary when used for the classification of sense of responsibility. It has excellent prospects for application in medical institutions with many complaints and a shortage of medical-patient processing specialists.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Review and Prospect of Multi-Label Text Classification Research.</p>
        <media xlink:href="jmir_v27i1e55721_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 2923 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>A method and system for classifying short text of product names based on attention mechanism: Part a.</p>
        <media xlink:href="jmir_v27i1e55721_app2.pdf" xlink:title="PDF File  (Adobe PDF File), 2989 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>A method and system for classifying short text of product names based on attention mechanism: Part b.</p>
        <media xlink:href="jmir_v27i1e55721_app3.pdf" xlink:title="PDF File  (Adobe PDF File), 2979 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>High frequency but meaningless stop words related to medical complaints.</p>
        <media xlink:href="jmir_v27i1e55721_app4.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Comparison of the Performance of Three Machine Learning Algorithms: Point Estimate and 95% Confidence Intervals.</p>
        <media xlink:href="jmir_v27i1e55721_app5.docx" xlink:title="DOCX File , 20 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Point Estimate and 95% CIs of each model’s performance metrics in distinguishing the four categories.</p>
        <media xlink:href="jmir_v27i1e55721_app6.docx" xlink:title="DOCX File , 19 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Precision, Recall, and F1-score on different N in Ngram-level TF-IDF (term frequency–inverse document frequency).</p>
        <media xlink:href="jmir_v27i1e55721_app7.png" xlink:title="PNG File , 367 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Initialized Support Vector Machine parameters.</p>
        <media xlink:href="jmir_v27i1e55721_app8.docx" xlink:title="DOCX File , 18 KB"/>
      </supplementary-material>
      <supplementary-material id="app9">
        <label>Multimedia Appendix 9</label>
        <p>The fine tuning hyperparameters.</p>
        <media xlink:href="jmir_v27i1e55721_app9.png" xlink:title="PNG File , 4420 KB"/>
      </supplementary-material>
      <supplementary-material id="app10">
        <label>Multimedia Appendix 10</label>
        <p>The fine tuning hyperparameters.</p>
        <media xlink:href="jmir_v27i1e55721_app10.png" xlink:title="PNG File , 3965 KB"/>
      </supplementary-material>
      <supplementary-material id="app11">
        <label>Multimedia Appendix 11</label>
        <p>Core Python code used in this study.</p>
        <media xlink:href="jmir_v27i1e55721_app11.rar" xlink:title="RAR File , 14 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BiGRU</term>
          <def>
            <p>Bidirectional Gated Recurrent Unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BiLSTM</term>
          <def>
            <p>Bidirectional Long Short-Term Memory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">BOW</term>
          <def>
            <p>bag-of-words</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">CC</term>
          <def>
            <p>chief complaints</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">CV</term>
          <def>
            <p>cross-validation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">DL</term>
          <def>
            <p>deep learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ED</term>
          <def>
            <p>emergency department</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">GRU</term>
          <def>
            <p>gated recurrent unit</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">HMM-Bigram</term>
          <def>
            <p>Hidden Markov Model Bigram</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">HCAT</term>
          <def>
            <p>Healthcare Complaint Analysis Tool</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">LSTM</term>
          <def>
            <p>long short-term memory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">MLR</term>
          <def>
            <p>Multifactor Logistic Regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">MNB</term>
          <def>
            <p>Multinomial Naive Bayes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">PAC</term>
          <def>
            <p>Patient Advocacy Center</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb20">PARS</term>
          <def>
            <p>Patient Advocacy Reporting System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb21">RNN</term>
          <def>
            <p>recurrent neural networks</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb22">ROC</term>
          <def>
            <p>receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb23">SGD</term>
          <def>
            <p>Stochastic Gradient Descent</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb24">SMOTE</term>
          <def>
            <p>Synthetic Minority Oversampling Technique</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb25">SVM</term>
          <def>
            <p>Support Vector Machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb26">TF-IDF</term>
          <def>
            <p>term frequency–inverse document frequency</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was funded by the Natural Science Foundation of Zhejiang Province, China (grant LGF22H220007); and Hangzhou Health Science and Technology Project, China (grant A20200746).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>Data that support the findings of the study are available upon request from the corresponding author.</p>
        <p>In addition, we have provided the important Python code related to this study in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 11</xref> for interested readers to download and use.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>Conceptualization was contributed by X Li, X Lou, and XF. Methodology was contributed by CK and GL. Validation was contributed by X Lou. Formal analysis was contributed by X Li. Writing—review and editing was contributed by XF. All authors have read and agreed to the published version of the manuscript. Authors GY (yugbme@zju.edu.cn) and XL (lxd2019@zju.edu.cn) are co-corresponding authors for this article.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoder-Wise</surname>
              <given-names>PS</given-names>
            </name>
          </person-group>
          <article-title>Patient complaints: not ours to own, but ours to fix</article-title>
          <source>J Contin Educ Nurs</source>
          <year>2015</year>
          <volume>46</volume>
          <issue>12</issue>
          <fpage>531</fpage>
          <lpage>532</lpage>
          <pub-id pub-id-type="doi">10.3928/00220124-20151112-01</pub-id>
          <pub-id pub-id-type="medline">26641145</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wofford</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Wofford</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Bothra</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kendrick</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lichstein</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Patient complaints about physician behaviors: a qualitative study</article-title>
          <source>Acad Med</source>
          <year>2004</year>
          <volume>79</volume>
          <issue>2</issue>
          <fpage>134</fpage>
          <lpage>138</lpage>
          <pub-id pub-id-type="doi">10.1097/00001888-200402000-00008</pub-id>
          <pub-id pub-id-type="medline">14744713</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hardavella</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Aamli-Gaagnat</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Saad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Rousalova</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sreter</surname>
              <given-names>KB</given-names>
            </name>
          </person-group>
          <article-title>How to give and receive  feedback effectively</article-title>
          <source>Breathe (Sheff)</source>
          <year>2017</year>
          <volume>13</volume>
          <issue>4</issue>
          <fpage>327</fpage>
          <lpage>333</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29209427"/>
          </comment>
          <pub-id pub-id-type="doi">10.1183/20734735.009917</pub-id>
          <pub-id pub-id-type="medline">29209427</pub-id>
          <pub-id pub-id-type="pii">EDU-0099-2017</pub-id>
          <pub-id pub-id-type="pmcid">PMC5709796</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>4</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Zhang, X. Xi, Z. Cui, Y. Zou and J</article-title>
          <source>Review and Prospect of Multi-Label Text Classification Research</source>
          <year>2023</year>
          <access-date>2023-12-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://caod.oriprobe.com/articles/65876090/Review_and_Prospect_of_Multi_Label_Text_Classifica.htm">https://caod.oriprobe.com/articles/65876090/Review_and_Prospect_of_Multi_Label_Text_Classifica.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>A method for classifying information in education policy texts based on an improved attention mechanism model</article-title>
          <source>Wirel. Commun. Mob. Comput</source>
          <year>2022</year>
          <volume>2</volume>
          <issue>1</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/epdf/10.1155/2022/5467572"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2022/5467572</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>6</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Schopf, D</article-title>
          <year>2023</year>
          <month>1</month>
          <day>18</day>
          <conf-name>Braun and F.  Matthes17th International Conference on Web Information Systems and Technologies (WEBIST) Electr Network 2023 Oct  2021 2023 Pages</conf-name>
          <conf-date>Oct 26, 2021 - Oct 28, 2021</conf-date>
          <conf-loc>Valletta, Malta</conf-loc>
          <pub-id pub-id-type="doi">10.1007/978-3-031-24197-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Review of text classification methods on deep learning</article-title>
          <source>Cmc-Computers Materials &#38; Continua</source>
          <year>2020</year>
          <volume>63</volume>
          <issue>3</issue>
          <fpage>1309</fpage>
          <lpage>1321</lpage>
          <pub-id pub-id-type="doi">10.32604/cmc.2020.010172</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Application of improved distributed naive Bayesian algorithms in text classification</article-title>
          <source>J Supercomput</source>
          <year>2019</year>
          <volume>75</volume>
          <issue>3</issue>
          <fpage>5831</fpage>
          <lpage>5847</lpage>
          <pub-id pub-id-type="doi">10.1007/s11227-019-02862-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Chinese text classification review</article-title>
          <year>2018</year>
          <conf-name>9th International Conference on Information Technology in Medicine and Education (ITME)</conf-name>
          <conf-date>2018 October 19-21</conf-date>
          <conf-loc>Hangzhou, China</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Branca Vergano</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Monesi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vicenti</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bizzoca</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Solarino</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Moretti</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Posterior approaches in malleolar fracture: when, why and how</article-title>
          <source>J Biol Regul Homeost Agents</source>
          <year>2020</year>
          <volume>34</volume>
          <issue>3 Suppl. 2</issue>
          <fpage>89</fpage>
          <lpage>95. ADVANCES IN MUSCULOSKELETAL DISEASES AND INFECTIONS</lpage>
          <pub-id pub-id-type="medline">32856446</pub-id>
          <pub-id pub-id-type="pii">14</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Dowling</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Classification of emergency department chief complaints into 7 syndromes: a retrospective analysis of 527,228 patients</article-title>
          <source>Ann Emerg Med</source>
          <year>2005</year>
          <volume>46</volume>
          <issue>5</issue>
          <fpage>445</fpage>
          <lpage>455</lpage>
          <pub-id pub-id-type="doi">10.1016/j.annemergmed.2005.04.012</pub-id>
          <pub-id pub-id-type="medline">16271676</pub-id>
          <pub-id pub-id-type="pii">S0196-0644(05)00464-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Christensen</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Haug</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ivanov</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Dowling</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Olszewski</surname>
              <given-names>RT</given-names>
            </name>
          </person-group>
          <article-title>Classifying free-text triage chief complaints into syndromic categories with natural language processing</article-title>
          <source>Artif Intell Med</source>
          <year>2005</year>
          <volume>33</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2004.04.001</pub-id>
          <pub-id pub-id-type="medline">15617980</pub-id>
          <pub-id pub-id-type="pii">S093336570400051X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Levin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Finley</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Heilig</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Chief complaint classification with recurrent neural networks</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <volume>93</volume>
          <fpage>103158</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30076-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103158</pub-id>
          <pub-id pub-id-type="medline">30926471</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30076-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC10563436</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karagounis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sarkar</surname>
              <given-names>IN</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>ES</given-names>
            </name>
          </person-group>
          <article-title>Coding free-text chief complaints from a health information exchange: a preliminary study</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2020</year>
          <volume>2020</volume>
          <fpage>638</fpage>
          <lpage>647</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33936438"/>
          </comment>
          <pub-id pub-id-type="medline">33936438</pub-id>
          <pub-id pub-id-type="pii">098_3410538</pub-id>
          <pub-id pub-id-type="pmcid">PMC8075463</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tootooni</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Pasupathy</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Heaton</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Clements</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Sir</surname>
              <given-names>MY</given-names>
            </name>
          </person-group>
          <article-title>CCMapper: an adaptive NLP-based free-text chief complaint mapping algorithm</article-title>
          <source>Comput Biol Med</source>
          <year>2019</year>
          <volume>113</volume>
          <fpage>103398</fpage>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2019.103398</pub-id>
          <pub-id pub-id-type="medline">31454613</pub-id>
          <pub-id pub-id-type="pii">S0010-4825(19)30275-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arnaud</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Elbattah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gignon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dequen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>NLP-based prediction of medical specialties at hospital admission using triage notes</article-title>
          <year>2021</year>
          <conf-name>2021 IEEE 9th International Conference on Healthcare Informatics (ICHI)</conf-name>
          <conf-date>2021  August 09-12</conf-date>
          <conf-loc>Victoria, BC, Canada</conf-loc>
          <publisher-name>IEEE</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1109/ICHI52183.2021.00103"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/ichi52183.2021.00103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Goudie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Arendts</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Meka</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Freeman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sprivulis</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sanfilippo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bennamoun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dwivedi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Applications of natural language processing at emergency department triage: a narrative review</article-title>
          <source>PLoS One</source>
          <year>2023</year>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>e0279953</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0279953"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0279953</pub-id>
          <pub-id pub-id-type="medline">38096321</pub-id>
          <pub-id pub-id-type="pii">PONE-D-22-34634</pub-id>
          <pub-id pub-id-type="pmcid">PMC10721204</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Branca Vergano</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Monesi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vicenti</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bizzoca</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Solarino</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Moretti</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Posterior approaches in malleolar fracture: when, why and how</article-title>
          <source>J Biol Regul Homeost Agents</source>
          <year>2020</year>
          <volume>34</volume>
          <issue>3 Suppl. 2</issue>
          <fpage>89</fpage>
          <lpage>95. ADVANCES IN MUSCULOSKELETAL DISEASES AND INFECTIONS</lpage>
          <pub-id pub-id-type="medline">32856446</pub-id>
          <pub-id pub-id-type="pii">14</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rustam</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Khalid</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aslam</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rupapara</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mehmood</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>GS</given-names>
            </name>
          </person-group>
          <article-title>A performance comparison of supervised machine learning models for Covid-19 tweets sentiment analysis</article-title>
          <source>PLoS One</source>
          <year>2021</year>
          <volume>16</volume>
          <issue>2</issue>
          <fpage>e0245909</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0245909"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0245909</pub-id>
          <pub-id pub-id-type="medline">33630869</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-26707</pub-id>
          <pub-id pub-id-type="pmcid">PMC7906356</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Karakaya</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Kilimci</surname>
              <given-names>ZH</given-names>
            </name>
          </person-group>
          <article-title>An efficient consolidation of word embedding and deep learning techniques for classifying anticancer peptides: FastText+BiLSTM</article-title>
          <source>PeerJ Comput Sci</source>
          <year>2024</year>
          <volume>10</volume>
          <fpage>e1831</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38435607"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj-cs.1831</pub-id>
          <pub-id pub-id-type="medline">38435607</pub-id>
          <pub-id pub-id-type="pii">cs-1831</pub-id>
          <pub-id pub-id-type="pmcid">PMC10909209</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alhazzani</surname>
              <given-names>NZ</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Turaiki</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Alkhodair</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Text classification of patient experience comments in Saudi dialect using deep learning techniques</article-title>
          <source>Applied Sciences</source>
          <year>2023</year>
          <volume>13</volume>
          <issue>18</issue>
          <fpage>10305</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/app131810305</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cascella</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Semeraro</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Montomoli</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bellini</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Piazza</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Bignami</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The breakthrough of large language models release for medical applications: 1-year timeline and perspectives</article-title>
          <source>J Med Syst</source>
          <year>2024</year>
          <volume>48</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38366043"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10916-024-02045-3</pub-id>
          <pub-id pub-id-type="medline">38366043</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-024-02045-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC10873461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Costa</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Flores</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Generative large language models are all-purpose text analytics engines: text-to-text learning is all your need</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2024</year>
          <volume>31</volume>
          <issue>9</issue>
          <fpage>1892</fpage>
          <lpage>1903</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocae078</pub-id>
          <pub-id pub-id-type="medline">38630580</pub-id>
          <pub-id pub-id-type="pii">7648661</pub-id>
          <pub-id pub-id-type="pmcid">PMC11339507</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Valmianski,</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Finn</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zisook</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Evaluating robustness of language models for chief complaint extraction from patient-generated text</article-title>
          <source>arXiv:1911.06915</source>
          <year>2019</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1911.06915"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>KS</given-names>
            </name>
          </person-group>
          <article-title>A statistical interpretation of term specificity and its application in retrieval</article-title>
          <source>Journal of Documentation</source>
          <year>1972</year>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>11</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1108/eb026526</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ehwerhemuepha</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rakovski</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A comparative study on deep learning models for text classification of unstructured medical notes with various levels of class imbalance</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2022</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>181</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-022-01665-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-022-01665-y</pub-id>
          <pub-id pub-id-type="medline">35780100</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-022-01665-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC9250736</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Convolutional neural networks for sentence classification</article-title>
          <year>2014</year>
          <conf-name>Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</conf-name>
          <conf-date>November 28, 2024</conf-date>
          <conf-loc>Doha, Qatar</conf-loc>
          <fpage>1746</fpage>
          <lpage>1751</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/d14-1181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Convolutional recurrent neural networks for text classification</article-title>
          <year>2019</year>
          <conf-name>2019 International Joint Conference on Neural Networks (IJCNN)</conf-name>
          <conf-date>July 14-19, 2019</conf-date>
          <conf-loc>Budapest, Hungary</conf-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1109/ijcnn.2019.8852406</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mccallum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nigam</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A comparison of event models for naive Bayes text classification</article-title>
          <source>AAAI-98 Workshop on Learning for text Categorization</source>
          <year>1998</year>
          <access-date>2024-12-04</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cdn.aaai.org/Workshops/1998/WS-98-05/WS98-05-007.pdf">https://cdn.aaai.org/Workshops/1998/WS-98-05/WS98-05-007.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Hovy</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Automatic evaluation of summaries using N-gram co-occurrence statistics</article-title>
          <year>2003</year>
          <conf-name>NAACL '03: Proceedings of the 2003 Conference of the North American Chapter of the Association for Computational Linguistics on Human Language Technology</conf-name>
          <conf-date>2003 May 27</conf-date>
          <conf-loc>Edmonton, Alberta, Canada</conf-loc>
          <publisher-loc>New York</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <pub-id pub-id-type="doi">10.3115/1073445.1073465</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yoshida</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>TFIDF, LSI and multi-word in information retrieval and text categorization</article-title>
          <year>2009</year>
          <conf-name>2008 IEEE International Conference on Systems, Man and Cybernetics</conf-name>
          <conf-date>2008 October 12-15</conf-date>
          <conf-loc>Singapore</conf-loc>
          <publisher-loc>Piscataway</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>108</fpage>
          <lpage>113</lpage>
          <pub-id pub-id-type="doi">10.1109/icsmc.2008.4811259</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joachims</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Text categorization with support vector machines: learning with many relevant features</article-title>
          <year>1998</year>
          <conf-name>ECML'98: Proceedings of the 10th European Conference on Machine Learning</conf-name>
          <conf-date>1998 April 21-23</conf-date>
          <conf-loc>Berlin, Heidelberg</conf-loc>
          <fpage>137</fpage>
          <lpage>142</lpage>
          <pub-id pub-id-type="doi">10.1007/bfb0026683</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Genkin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Madigan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Large-scale Bayesian logistic regression for text categorization</article-title>
          <source>Technometrics</source>
          <year>2007</year>
          <volume>49</volume>
          <issue>3</issue>
          <fpage>291</fpage>
          <lpage>304</lpage>
          <pub-id pub-id-type="doi">10.1198/004017007000000245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Chinese text classification by combining Chinese-BERTology-wwm and GCN</article-title>
          <source>PeerJ Comput Sci</source>
          <year>2023</year>
          <volume>9</volume>
          <fpage>e1544</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37705631"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj-cs.1544</pub-id>
          <pub-id pub-id-type="medline">37705631</pub-id>
          <pub-id pub-id-type="pii">cs-1544</pub-id>
          <pub-id pub-id-type="pmcid">PMC10495955</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Chinese text classification model based on deep learning</article-title>
          <source>Future Internet</source>
          <year>2018</year>
          <volume>10</volume>
          <issue>11</issue>
          <fpage>113</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3390/fi10110113"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/fi10110113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Phung</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karmakar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shilton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yearwood</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dimitrova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Venkatesh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berk</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: a multidisciplinary view</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>e323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/12/e323/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id>
          <pub-id pub-id-type="medline">27986644</pub-id>
          <pub-id pub-id-type="pii">v18i12e323</pub-id>
          <pub-id pub-id-type="pmcid">PMC5238707</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Punctuation as implicit annotations for Chinese word segmentation</article-title>
          <source>Computational Linguistics</source>
          <year>2009</year>
          <volume>35</volume>
          <issue>4</issue>
          <fpage>505</fpage>
          <lpage>512</lpage>
          <pub-id pub-id-type="doi">10.1162/coli.2009.35.4.35403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beauprez</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Bidet-Ildei</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Hiraki</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Does watching Han Solo or C-3PO similarly influence our language processing?</article-title>
          <source>Psychol Res</source>
          <year>2020</year>
          <volume>84</volume>
          <issue>6</issue>
          <fpage>1572</fpage>
          <lpage>1585</lpage>
          <pub-id pub-id-type="doi">10.1007/s00426-019-01169-3</pub-id>
          <pub-id pub-id-type="medline">30931488</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00426-019-01169-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Combining probability models and web mining models: a framework for proper name transliteration</article-title>
          <source>Inf Technol Manage</source>
          <year>2007</year>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>91</fpage>
          <lpage>103</lpage>
          <pub-id pub-id-type="doi">10.1007/s10799-007-0031-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bansal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Saini</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yadav</surname>
              <given-names>JK</given-names>
            </name>
          </person-group>
          <article-title>Analysis of SMOTE: modified for diverse imbalanced datasets under the IoT environment</article-title>
          <source>International Journal of Information Retrieval Research</source>
          <year>2021</year>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>23</fpage>
          <pub-id pub-id-type="doi">10.4018/ijirr.2021040102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Nie</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kuang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A COVID-19 risk score combining chest CT radiomics and clinical characteristics to differentiate COVID-19 pneumonia from other viral pneumonias</article-title>
          <source>Aging (Albany NY)</source>
          <year>2021</year>
          <volume>13</volume>
          <issue>7</issue>
          <fpage>9186</fpage>
          <lpage>9224</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aging-us.com/full/202735"/>
          </comment>
          <pub-id pub-id-type="doi">10.18632/aging.202735</pub-id>
          <pub-id pub-id-type="medline">33713401</pub-id>
          <pub-id pub-id-type="pii">202735</pub-id>
          <pub-id pub-id-type="pmcid">PMC8064216</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: synthetic minority over-sampling technique</article-title>
          <source>JAIR</source>
          <year>2002</year>
          <volume>16</volume>
          <fpage>321</fpage>
          <lpage>357</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilcox</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The role of domain knowledge in automating medical text report classification</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2003</year>
          <volume>10</volume>
          <issue>4</issue>
          <fpage>330</fpage>
          <lpage>338</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/12668687"/>
          </comment>
          <pub-id pub-id-type="doi">10.1197/jamia.M1157</pub-id>
          <pub-id pub-id-type="medline">12668687</pub-id>
          <pub-id pub-id-type="pii">M1157</pub-id>
          <pub-id pub-id-type="pmcid">PMC181983</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jerng</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Comparison of complaints to the intensive care units and those to the general wards: an analysis using the Healthcare Complaint Analysis Tool in an academic medical center in Taiwan</article-title>
          <source>Crit Care</source>
          <year>2018</year>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>335</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ccforum.biomedcentral.com/articles/10.1186/s13054-018-2271-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13054-018-2271-y</pub-id>
          <pub-id pub-id-type="medline">30522508</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13054-018-2271-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6282256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dhakal</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>NVivo</article-title>
          <source>J Med Libr Assoc</source>
          <year>2022</year>
          <volume>110</volume>
          <issue>2</issue>
          <fpage>270</fpage>
          <lpage>272</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35440911"/>
          </comment>
          <pub-id pub-id-type="doi">10.5195/jmla.2022.1271</pub-id>
          <pub-id pub-id-type="medline">35440911</pub-id>
          <pub-id pub-id-type="pii">jmla.2022.1271</pub-id>
          <pub-id pub-id-type="pmcid">PMC9014916</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Policy analysis of the integration of sports and medicine against the backdrop of "Healthy China": a qualitative study using NVivo</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2023</year>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>2079</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph20032079"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph20032079</pub-id>
          <pub-id pub-id-type="medline">36767445</pub-id>
          <pub-id pub-id-type="pii">ijerph20032079</pub-id>
          <pub-id pub-id-type="pmcid">PMC9915374</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yamanouchi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ikeda</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Usuku</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>An alternative application of natural language processing to express a characteristic feature of diseases in Japanese medical records</article-title>
          <source>Methods Inf Med</source>
          <year>2023</year>
          <volume>62</volume>
          <issue>3-04</issue>
          <fpage>110</fpage>
          <lpage>118</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/a-2039-3773"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/a-2039-3773</pub-id>
          <pub-id pub-id-type="medline">36809794</pub-id>
          <pub-id pub-id-type="pmcid">PMC10462427</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>ZG</given-names>
            </name>
          </person-group>
          <article-title>Machine translation of Chinese classical poetry: a comparison among ChatGPT, Google Translate, and DeepL Translator</article-title>
          <source>Humanit Soc Sci Commun</source>
          <year>2024</year>
          <month>06</month>
          <day>26</day>
          <volume>11</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1057/s41599-024-03363-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reader</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Gillespie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Patient complaints in healthcare systems: a systematic review and coding taxonomy</article-title>
          <source>BMJ Qual Saf</source>
          <year>2014</year>
          <volume>23</volume>
          <issue>8</issue>
          <fpage>678</fpage>
          <lpage>689</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://qualitysafety.bmj.com/lookup/pmidlookup?view=long&#38;pmid=24876289"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjqs-2013-002437</pub-id>
          <pub-id pub-id-type="medline">24876289</pub-id>
          <pub-id pub-id-type="pii">bmjqs-2013-002437</pub-id>
          <pub-id pub-id-type="pmcid">PMC4112446</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>HaCohen-Kerner</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dilmon</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hone</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ben-Basan</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Automatic classification of complaint letters according to service provider categories</article-title>
          <source>Information Processing &#38; Management</source>
          <year>2019</year>
          <volume>56</volume>
          <issue>6</issue>
          <fpage>102102</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.ipm.2019.102102"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ipm.2019.102102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oyedele</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Determining the optimal number of folds to use in a K-fold cross-validation: a neural network classification experiment</article-title>
          <source>Research in Mathematics</source>
          <year>2023</year>
          <volume>10</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1080/27684830.2023.2201015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elmessiry</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>WO</given-names>
            </name>
            <name name-style="western">
              <surname>Catron</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Karrass</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>Triaging patient complaints: Monte Carlo cross-validation of six machine learning classifiers</article-title>
          <source>JMIR Med Inform</source>
          <year>2017</year>
          <volume>5</volume>
          <issue>3</issue>
          <fpage>e19</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2017/3/e19/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.7140</pub-id>
          <pub-id pub-id-type="medline">28760726</pub-id>
          <pub-id pub-id-type="pii">v5i3e19</pub-id>
          <pub-id pub-id-type="pmcid">PMC5556254</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cortes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vapnik</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Support-vector networks</article-title>
          <source>Mach Learn</source>
          <year>1995</year>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>273</fpage>
          <lpage>297</lpage>
          <pub-id pub-id-type="doi">10.1007/BF00994018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tolles</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Meurer</surname>
              <given-names>WJ</given-names>
            </name>
          </person-group>
          <article-title>Logistic regression: relating patient characteristics to outcomes</article-title>
          <source>JAMA</source>
          <year>2016</year>
          <volume>316</volume>
          <issue>5</issue>
          <fpage>533</fpage>
          <lpage>534</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2016.7653</pub-id>
          <pub-id pub-id-type="medline">27483067</pub-id>
          <pub-id pub-id-type="pii">2540383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McCallum</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>Graphical Models, Lecture2: Bayesian Network Representation</source>
          <year>2019</year>
          <access-date>2022-10-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://people.cs.umass.edu/~mccallum/courses/gm2011/02-bn-rep.pdf">https://people.cs.umass.edu/~mccallum/courses/gm2011/02-bn-rep.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vakharia</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Suthar</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Solanki</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Hybrid perovskites thin films morphology identification by adapting multiscale-SinGAN architecture, heat transfer search optimized feature selection and machine learning algorithms</article-title>
          <source>Phys. Scr</source>
          <year>2023</year>
          <volume>98</volume>
          <issue>2</issue>
          <fpage>025203</fpage>
          <pub-id pub-id-type="doi">10.1088/1402-4896/acae49</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>YA</given-names>
            </name>
            <name name-style="western">
              <surname>Awwad</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Razgan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Maarouf</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Hyperparameter search for machine learning algorithms for optimizing the computational complexity</article-title>
          <source>Processes</source>
          <year>2023</year>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>349</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3390/pr11020349"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/pr11020349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nair</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vakharia</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Woźniak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shafi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fazal Ijaz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>AI-driven digital twin model for reliable lithium-ion battery discharge capacity predictions</article-title>
          <source>International Journal of Intelligent Systems</source>
          <year>2024</year>
          <volume>2024</volume>
          <fpage>1</fpage>
          <lpage>18</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1155/2024/8185044"/>
          </comment>
          <pub-id pub-id-type="doi">10.1155/2024/8185044</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
