<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v28i1e89850</article-id><article-id pub-id-type="doi">10.2196/89850</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Automated Identification of Nursing Diagnoses and Interventions From Nursing Records Using a Retrieval-Augmented Large Language Model Approach: Quantitative Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Li</surname><given-names>Minye</given-names></name><degrees>MAST, RN</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Chen</surname><given-names>Dianjie</given-names></name><degrees>RN</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Xiao</surname><given-names>Qun</given-names></name><degrees>RN</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>He</surname><given-names>Zhengji</given-names></name><degrees>RN</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Yanyan</given-names></name><degrees>RN</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhong</surname><given-names>Jinlan</given-names></name><degrees>RN</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Luo</surname><given-names>Yiwei</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ma</surname><given-names>Hui</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Nursing, Chinese People's Liberation Army General Hospital</institution><addr-line>28 Fuxing Road, Haidian District</addr-line><addr-line>Beijing</addr-line><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff2"><institution>Department of Infectious Diseases, 5th Medical Center, Chinese People's Liberation Army General Hospital</institution><addr-line>Beijing</addr-line><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff3"><institution>School of Nursing, Southern Medical University</institution><addr-line>Guangzhou</addr-line><addr-line>Guangdong</addr-line><country>China</country></aff><aff id="aff4"><institution>Department of Respiratory and Critical Care Medicine, 1st Medical Center, Chinese People's Liberation Army General Hospital</institution><addr-line>Beijing</addr-line><addr-line>Beijing</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Yang</surname><given-names>Juntao</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Cesare</surname><given-names>Manuele</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Hui Ma, PhD, Department of Nursing, Chinese People's Liberation Army General Hospital, 28 Fuxing Road, Haidian District, Beijing, Beijing, China, 86 13681197727; <email>mahui-28@163.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>29</day><month>4</month><year>2026</year></pub-date><volume>28</volume><elocation-id>e89850</elocation-id><history><date date-type="received"><day>18</day><month>12</month><year>2025</year></date><date date-type="rev-recd"><day>29</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>29</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Minye Li, Dianjie Chen, Qun Xiao, Zhengji He, Yanyan Zhang, Jinlan Zhong, Yiwei Luo, Hui Ma. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 29.4.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2026/1/e89850"/><abstract><sec><title>Background</title><p>Electronic health records (EHRs) have been widely adopted, but most nursing records remain in unstructured free-text format, which limits the secondary use of nursing data. Standardized terminologies improve semantic interoperability; however, manual annotation is labor intensive and yields inconsistent results. Advances in large language models (LLMs) and retrieval-augmented generation (RAG) have created new possibilities for automating the mapping of nursing records to standardized terminologies, thereby enhancing the utility of nursing data.</p></sec><sec><title>Objective</title><p>This study aimed to develop and evaluate Clinical Care Classification nursing terminology with retrieval-augmented mapping (CNTRAM), a 2-stage RAG framework incorporating an LLM, for the automated mapping of nursing diagnoses and interventions from free-text intensive care unit nursing records to standardized Clinical Care Classification (CCC) terms.</p></sec><sec sec-type="methods"><title>Methods</title><p>CNTRAM is a 2-stage retrieval-augmented framework that integrates dense embedding retrieval, retrieval-enhanced prompting, and few-shot LLM guidance to map free-text nursing records to standardized CCC terminology. Free-text records and their segments were embedded as subqueries to retrieve the most relevant CCC reference entries and annotated examples, which were merged to construct context windows. Each subquery was combined with its retrieved context using a predefined RAG prompt template that enforces CCC coding rules and a structured JSON schema and was then processed by an LLM to generate CCC outputs. A gold standard dataset of 100 intensive care unit nursing records was annotated by 3 senior nurses and finalized via consensus, with interrater reliability quantified using the Fleiss &#x03BA;. Model performance was compared with traditional baselines (term frequency&#x2013;inverse document frequency, Bidirectional Encoder Representations from Transformer, and fine-tuned Bidirectional Encoder Representations from Transformers model) and 4 LLMs (Mistral-7B, Qwen3-14B, Llama3.3-70B, and DeepSeek-R1) across no-RAG, zero-shot, and few-shot settings, using precision, recall, <italic>F</italic><sub>1</sub>-score, and intersection over union (IoU) as metrics.</p></sec><sec sec-type="results"><title>Results</title><p>Interrater agreement was substantial, with Fleiss &#x03BA;=0.6449 for diagnoses and &#x03BA;=0.6180 for interventions. CNTRAM achieved substantial performance gains over all baseline approaches. For nursing diagnoses, DeepSeek-R1 with RAG+few-shot prompting achieved the best performance, with a precision of 0.7909, a recall of 0.7901, an <italic>F</italic><sub>1</sub>-score of 0.7836, and an IoU of 0.7614. These results were significantly higher than those of traditional baselines (<italic>F</italic><sub>1</sub>-score 0.0268&#x2010;0.2027), no-RAG LLMs (<italic>F</italic><sub>1</sub>-score 0.0299&#x2010;0.0588), and RAG+zero-shot LLMs (<italic>F</italic><sub>1</sub>-score 0.0716&#x2010;0.2160). For nursing interventions, the same configuration achieved a precision of 0.8453, a recall of 0.8504, an <italic>F</italic><sub>1</sub>-score of 0.8413, and an IoU of 0.8097, outperforming traditional baselines (<italic>F</italic><sub>1</sub>-score 0.1200&#x2010;0.2323), no-RAG LLMs (<italic>F</italic><sub>1</sub>-score 0.0077&#x2010;0.0189), and RAG+zero-shot LLMs (<italic>F</italic><sub>1</sub>-score 0.2744&#x2010;0.4461).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study developed CNTRAM, an LLM-based 2-stage RAG framework that combines dense embedding retrieval and few-shot prompting for CCC terminology mapping. Using DeepSeek-R1, CNTRAM outperformed baseline models, improved mapping accuracy, and provided a feasible solution for standardizing unstructured nursing data.</p></sec></abstract><kwd-group><kwd>large language model</kwd><kwd>LLM</kwd><kwd>retrieval-augmented generation</kwd><kwd>RAG</kwd><kwd>nursing terminology</kwd><kwd>Clinical Care Classification</kwd><kwd>nursing records</kwd><kwd>nursing informatics</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>The widespread adoption of electronic health records (EHRs) has significantly enhanced the collection and use of clinical data [<xref ref-type="bibr" rid="ref1">1</xref>], providing a solid foundation for data-driven research and continuous improvement of health care practices [<xref ref-type="bibr" rid="ref2">2</xref>]. Within EHR systems, nursing records constitute a core data source, documenting nurses&#x2019; clinical observations, patient assessments, symptom responses, and nursing interventions delivered during routine care [<xref ref-type="bibr" rid="ref3">3</xref>]. These records support clinical decision-making and care planning and also constitute an important primary data source for nursing research [<xref ref-type="bibr" rid="ref4">4</xref>]. Despite the transition of nursing documentation from paper-based to electronic systems, most nursing records are still recorded in unstructured free-text form. This lack of structure substantially constrains their secondary use, semantic interoperability, and integration into clinical decision support systems [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>To address these challenges, standardized nursing terminologies (SNTs) have been developed to enhance the consistency, comparability, and interoperability of nursing records [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Among them, the Clinical Care Classification (CCC) system is a comprehensive, coded nursing terminology designed specifically for the digital documentation of nursing care [<xref ref-type="bibr" rid="ref8">8</xref>]. The CCC system comprises 176 nursing diagnoses and 201 core nursing interventions, organized into 21 care components covering physiological, functional, psychological, and health behavioral domains. By integrating nursing diagnoses, interventions, and outcomes within a unified structure, CCC provides a systematic framework for representing nursing practice [<xref ref-type="bibr" rid="ref9">9</xref>]. Compared to the more complex and granular North American Nursing Diagnosis Association International (NANDA-I), Nursing Interventions Classification (NIC), or International Classification for Nursing Practice systems, the CCC system has a more compact semantic space, reducing conceptual ambiguity during the automatic mapping process [<xref ref-type="bibr" rid="ref10">10</xref>]. A Chinese translation of the CCC system was released in 2018 to support its application in Chinese-language clinical settings, enabling standardized nursing documentation in Chinese hospitals and improving the interoperability of nursing data [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>Mapping free-text nursing records to CCC terms enables the structured representation of nursing care processes, supports care quality assessment, and facilitates large-scale nursing research [<xref ref-type="bibr" rid="ref12">12</xref>]. However, CCC-based annotation still relies heavily on manual coding, which is labor intensive, time consuming, and subject to interannotator variability, highlighting the urgent need for automated solutions that can reliably link unstructured nursing text to standardized terminology [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>Recent advances in natural language processing and machine learning have substantially improved the automated structuring of unstructured clinical text [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. Early rule-based and dictionary matching approaches were limited by heavy manual maintenance and poor generalizability to complex nursing language [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. The advent of pretrained contextual models, such as Bidirectional Encoder Representations from Transformers (BERT) [<xref ref-type="bibr" rid="ref20">20</xref>], enabled deeper semantic understanding and improved performance in tasks such as entity recognition, relation extraction, and text classification. Recently, large language models (LLMs) have further revolutionized the field, exhibiting strong capabilities in long-text comprehension, zero- and few-shot learning, and structured text generation [<xref ref-type="bibr" rid="ref21">21</xref>]. Techniques such as retrieval-augmented generation (RAG) further enhance factual accuracy and interpretability by integrating external knowledge retrieval [<xref ref-type="bibr" rid="ref22">22</xref>]. For example, a nursing-focused study showed that integrating a curated breast cancer nursing knowledge base with GPT-4 (OpenAI) improved the accuracy and clinical relevance of nursing responses while preserving empathetic communication [<xref ref-type="bibr" rid="ref23">23</xref>].</p><p>Despite these technological advances, applications within nursing informatics remain limited. Most existing methods are rule driven, limited in scalability, or focused on general clinical text processing, while studies specifically targeting the automated identification of nursing diagnoses and interventions remain scarce. To address this gap, this study proposes an LLM-based framework for the automated extraction of nursing diagnoses and interventions aligned with the CCC system, aiming to reduce reliance on manual coding by nurses, enhance interoperability, and support data-driven decision-making in nursing practice.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>This study was approved by the ethics committee of the Chinese People&#x2019;s Liberation Army General Hospital (S2024-767-01). Given the retrospective nature of this study, the requirement for written informed consent was waived by the ethics committee. No compensation was provided to participants. All data were fully anonymized before being included in the study. The study adhered to relevant ethical guidelines and protected the privacy and confidentiality of all patient records throughout the research process.</p></sec><sec id="s2-2"><title>Dataset</title><p>This study included 197,337 nursing records from the intensive care unit (ICU) of Chinese People&#x2019;s Liberation Army General Hospital, covering the period from January 2023 to May 2025. These records consisted of free-text descriptions of time-stamped nursing assessments, interventions, and patient responses. All records were deidentified using a validated deidentification pipeline.</p></sec><sec id="s2-3"><title>Gold Standard Data Annotation</title><p>To establish a gold standard dataset for model evaluation, 100 ICU nursing records were randomly selected for expert annotation. Three senior registered nurses, each with &#x003E;5 years of ICU experience and prior familiarity with SNTs, independently annotated the nursing diagnoses and interventions for all samples. Before annotation, the annotators received a structured briefing on the CCC terminology, including term definitions, hierarchical structure, and mapping principles. Annotation was conducted in accordance with the official CCC terminology definitions and classification guidelines. Interrater reliability among the 3 annotators was assessed using the Fleiss &#x03BA;, which indicated substantial agreement. The gold standard dataset was established through discussions among the 3 nurses to reach consensus on differing annotations. A representative annotated example is shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Annotation example. This figure shows how a segment of unstructured intensive care unit nursing text from a local hospital was manually annotated using Clinical Care Classification nursing diagnoses and interventions. Text segments with the same background color indicate the correspondence between the narrative content and the assigned nursing diagnosis or intervention.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e89850_fig01.png"/></fig></sec><sec id="s2-4"><title>Annotated Corpus</title><p>In total, 1500 nursing text samples were randomly selected from the full dataset to construct a manually annotated corpus. Two nursing postgraduate students, each with at least 3 months of ICU training, independently performed annotation after receiving standardized training based on the CCC terminology guidelines. The task involved identifying nursing diagnoses and interventions mentioned in each text and mapping them to the most appropriate CCC terms. When exact matches were unavailable, corresponding NANDA-I and NIC terms were applied as supplementary standards (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). In cases of disagreement, a senior ICU nurse adjudicated the final labels. To ensure data separation, the 100 expert-annotated evaluation records and the 1500 manually annotated corpus samples were sourced from distinct patients.</p></sec><sec id="s2-5"><title>CCC Nursing Terminology With Retrieval-Augmented Mapping</title><p>We developed CCC nursing terminology with retrieval-augmented mapping (CNTRAM), a 2-stage RAG framework, to map free-text nursing records to standardized CCC diagnoses and interventions (<xref ref-type="fig" rid="figure2">Figure 2</xref>). CNTRAM integrates dense embedding retrieval, retrieval-enhanced prompting, and few-shot LLM guidance to improve mapping accuracy and coverage.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Clinical Care Classification (CCC) nursing terminology with retrieval-augmented mapping (CNTRAM) framework. This figure illustrates the 2-stage CNTRAM process for mapping free-text nursing records to standardized CCC diagnoses and interventions. Free-text records are segmented into text chunks, while the original records are retained as subqueries. All subqueries, together with CCC reference entries and annotated corpora, are embedded into 512-dimensional vectors using the BAAI (Beijing Academy of Artificial Intelligence) General Embedding&#x2013;small-zh model. For each subquery, the top 5 most relevant entries are separately retrieved from CCC references and annotated corpora, then merged and deduplicated to construct context windows. Each subquery is combined with its context window to generate prompts under a predefined retrieval-augmented generation template that adheres to CCC coding guidelines and structured JSON output requirements. Prompts are fed into a locally deployed large language model, and the generated JSON outputs are parsed, cross-referenced against the CCC database for metadata validation, and formatted into standardized nursing coding results.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e89850_fig02.png"/></fig><p>In the first stage, free-text records were segmented into text chunks using Chinese and English punctuation, while the original records were retained as subqueries. Given the small scale of the CCC terminology set and its abundant clinically equivalent paraphrases, we prioritized a fine-grained semantic matching strategy. Specifically, we used the BAAI (Beijing Academy of Artificial Intelligence) General Embedding&#x2013;small-zh model to embed each subquery, all CCC reference entries, and the full annotated corpus into 512-dimensional dense vectors. Semantic similarity between subqueries, reference entries, and annotated corpora was computed using matrix-based cosine scoring. In detail, the embedding vectors of subqueries and CCC reference entries were L2 normalized to unit norm. Subsequently, matrix multiplication was performed to compute the dot product of these normalized vectors, generating a similarity matrix of dimensions (number of subqueries&#x00D7;number of reference entries), where each element quantifies the semantic similarity between an individual subquery and a reference entry. Retrieval results from all subqueries were aggregated, and the unique entries remaining after duplicate removal were sorted by their similarity scores. To determine the retrieval window, we evaluated retrieval coverage via Recall@k (k=1, 3, 5, and 10). Recall@5 provided the optimal balance between retrieval sensitivity and computational cost and was adopted as the default setting (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). For each subquery, the top 5 most relevant entries were retrieved separately from both the CCC reference entries and the annotated corpus, merged, and deduplicated to construct context windows.</p><p>In the second stage, prompts were generated by combining each subquery with its retrieved context following a predefined RAG template. This template enforces CCC coding guidelines, which incorporate the supplementary NANDA-I and NIC terms, and defines a structured JSON output schema (<xref ref-type="fig" rid="figure3">Figure 3</xref>). These prompts were then processed by a locally deployed LLM, which generated structured JSON outputs [<xref ref-type="bibr" rid="ref24">24</xref>]. The resulting JSON was parsed with regular expressions, cross-referenced against the term database for metadata validation, and formatted into a standardized structure suitable for downstream analysis.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Clinical Care Classification (CCC) nursing terminology with retrieval-augmented mapping (CNTRAM) prompt. This figure shows the standardized prompt format used in CNTRAM and the expected JSON-based output. The prompt specifies that the model should return CCC nursing diagnosis and intervention codes as a JSON array, without explanatory text or duplication; an empty array is returned if no valid codes are identified.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e89850_fig03.png"/></fig></sec><sec id="s2-6"><title>Experiments</title><p>To establish comparative baselines and evaluate CNTRAM&#x2019;s relative performance, multiple models were implemented, encompassing traditional statistical methods, pretrained language models, and LLMs.</p><p>Free-text inputs were transformed into term frequency&#x2013;inverse document frequency (TF-IDF) vectors [<xref ref-type="bibr" rid="ref25">25</xref>], and candidate CCC terms were ranked by cosine similarity. This served as a lexical-matching baseline reflecting rule-driven coding.</p><p>Contextual embeddings were generated using BERT [<xref ref-type="bibr" rid="ref20">20</xref>]. Semantic similarity between text segments and CCC entries was calculated via cosine distance. This represented a rule-driven baseline with contextual semantic awareness. Additionally, BERT was fine-tuned on the annotated corpus of 1500 records to provide a supervised baseline for comparison.</p><p>Llama3.3-70B (Meta Platforms Inc) [<xref ref-type="bibr" rid="ref26">26</xref>], Qwen3-14B (Alibaba Group) [<xref ref-type="bibr" rid="ref27">27</xref>], Mistral-7B (Mistral AI) [<xref ref-type="bibr" rid="ref28">28</xref>], and DeepSeek-R1 (DeepSeek) [<xref ref-type="bibr" rid="ref29">29</xref>] were evaluated under zero-shot and few-shot prompting to test their intrinsic ability to align free-text nursing notes with CCC terms based solely on coding rules. Additionally, no-RAG experiments were conducted for each LLM to serve as a comparison.</p></sec><sec id="s2-7"><title>Prompting Strategies</title><p>To examine the influence of contextual retrieval and example-based guidance, 2 prompting strategies were compared under the CNTRAM framework.</p><p>First, zero-shot prompting was used; for each generated subquery derived from both the segmented text and the original records, the top 5 most semantically relevant CCC coding rules were retrieved and incorporated into the prompt [<xref ref-type="bibr" rid="ref30">30</xref>]. No example demonstrations were included.</p><p>For few-shot prompting, few-shot examples were selected by retrieving the top 5 most semantically relevant examples for each subquery generated from both the segmented text and the original records [<xref ref-type="bibr" rid="ref31">31</xref>]. These examples were combined with retrieved CCC coding rules, which were generated following the same approach as zero-shot prompting, to form the final prompt. We further assessed the contribution of few-shot examples without retrieval using 20 static examples in the prompt.</p></sec><sec id="s2-8"><title>Evaluation Metrics</title><p>Model performance was evaluated using precision, recall, <italic>F</italic><sub>1</sub>-score, and intersection over union (IoU), with each nursing record treated as a set of terms. CCC terms and supplementary NANDA-I and NIC terms were included in the evaluation. As a single record may contain multiple clinically related diagnoses and interventions, IoU was additionally used to more comprehensively assess the model&#x2019;s ability to identify all nursing terms, capturing their combinatorial characteristics. IoU is defined as the ratio of the intersection to the union of the predicted and gold standard term sets.</p><p>For a given record <italic>i</italic>, let <italic>G</italic><sub><italic>i</italic></sub> denote the gold standard term set and <italic>P</italic><sub><italic>i</italic></sub> denote the predicted term set. In this notation, &#x201C;|&#x22C5;|&#x201D; denotes set cardinality, &#x201C;\&#x201D; denotes set difference, and &#x201C;&#x2229;&#x201D; denotes intersection. The evaluation components were defined as follows:</p><p><inline-formula><mml:math id="ieqn1"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>T</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:msub><mml:mi>G</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2229;</mml:mo><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:mtext>&#x00A0;</mml:mtext><mml:mo>,</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2216;</mml:mo><mml:msub><mml:mi>G</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:mtext>&#x00A0;</mml:mtext><mml:mo>,</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mi>N</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mrow><mml:mo>/</mml:mo></mml:mrow><mml:msub><mml:mi>G</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2216;</mml:mo><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo>/</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> </p><p>Metrics for each sample were calculated as follows:</p><disp-formula id="E1"><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>P</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>o</mml:mi><mml:msub><mml:mi>n</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac><mml:mo>,</mml:mo><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi><mml:msub><mml:mi>l</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mi>N</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac><mml:mo>,</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mn>1</mml:mn><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>2</mml:mn><mml:mo>&#x22C5;</mml:mo><mml:mi>P</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>o</mml:mi><mml:msub><mml:mi>n</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi><mml:msub><mml:mi>l</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>P</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>o</mml:mi><mml:msub><mml:mi>n</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>R</mml:mi><mml:mi>e</mml:mi><mml:mi>c</mml:mi><mml:mi>a</mml:mi><mml:mi>l</mml:mi><mml:msub><mml:mi>l</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>and</p><p><inline-formula><mml:math id="ieqn2"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>I</mml:mi><mml:mi>o</mml:mi><mml:msub><mml:mi>U</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>T</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mi>P</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>F</mml:mi><mml:msub><mml:mi>N</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> </p><p>where <italic>TP</italic><sub><italic>i</italic></sub> is the number of correctly predicted terms in record <italic>i</italic>, <italic>FP</italic><sub><italic>i</italic></sub> is the number of predicted terms not in the gold standard set, and <italic>FN</italic><sub><italic>i</italic></sub> is the number of gold standard terms missed by the prediction. Overall performance was calculated as the macroaverage of each metric across all records.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Characteristics of the Dataset</title><p>This dataset contained 197,337 records from 880 patients, representing an older cohort (median age 67, IQR 57-74 years) with a wide range of ICU lengths of stay (median 1 day, IQR 0-6 days), as shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Dataset characteristics (N=880).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">Values</td></tr></thead><tbody><tr><td align="left" valign="top">Nursing note entries, n</td><td align="left" valign="top">197,337</td></tr><tr><td align="left" valign="top">Age (years), median (IQR)</td><td align="left" valign="top">67 (57-74)</td></tr><tr><td align="left" valign="top">Female sex, n (%)</td><td align="left" valign="top">287 (32.6)</td></tr><tr><td align="left" valign="top">Length of stay in the intensive care unit (days), median (IQR)</td><td align="left" valign="top">1 (0&#x2010;6)</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Annotator Agreement and Coverage of CCC Terminology</title><p>Interrater reliability was evaluated using the Fleiss &#x03BA;, which measures the degree of agreement among multiple annotators beyond chance. The results showed substantial consistency for both categories, with &#x03BA;=0.65 for nursing diagnoses and &#x03BA;=0.62 for nursing interventions (<xref ref-type="table" rid="table2">Table 2</xref>). These results indicate that the 3 nurses demonstrated a consistent application of CCC terminology during independent annotation, providing a solid foundation for constructing the final consensus-based reference standard used for model evaluation. In terms of terminology coverage, a total of 65 unique nursing diagnoses were observed in the annotated 100-record test set, corresponding to 36.9% of the 176 CCC diagnosis codes. For nursing interventions, 106 unique codes were present, representing 52.7% of the 201 CCC intervention codes.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Fleiss &#x03BA; for interrater agreement among 3 senior registered nurses.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Items</td><td align="left" valign="bottom">Observed agreement</td><td align="left" valign="bottom">Expected agreement</td><td align="left" valign="bottom">1 minus expected agreement</td><td align="left" valign="bottom">Fleiss &#x03BA;</td></tr></thead><tbody><tr><td align="left" valign="top">Nursing diagnoses</td><td align="left" valign="top">0.9886</td><td align="left" valign="top">0.9679</td><td align="left" valign="top">0.0321</td><td align="left" valign="top">0.6449</td></tr><tr><td align="left" valign="top">Nursing interventions</td><td align="left" valign="top">0.9830</td><td align="left" valign="top">0.9555</td><td align="left" valign="top">0.0445</td><td align="left" valign="top">0.6180</td></tr></tbody></table></table-wrap></sec><sec id="s3-3"><title>Model Performance</title><p>The CNTRAM framework demonstrated comprehensive superiority over TF-IDF, BERT, fine-tuned BERT, and zero-shot LLMs in mapping nursing records to standardized CCC terminology by integrating retrieval-enhanced and few-shot prompting. For nursing diagnoses (<xref ref-type="table" rid="table3">Table 3</xref>), the best-performing model was DeepSeek-R1. It achieved a precision of 0.7909, a recall of 0.7901, an <italic>F</italic><sub>1</sub>-score of 0.7836, and an IoU of 0.7614. All other approaches showed lower results across all metrics. Among traditional methods and language models, the <italic>F</italic><sub>1</sub>-score ranged from 0.0268 (BERT) to 0.5253 (Qwen3-14B with RAG+few-shot), and the IoU values ranged from 0.0142 (BERT) to 0.4987 (Qwen3-14B with RAG+few-shot).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Model performance for mapping nursing diagnoses.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Models and prompting strategies</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="bottom">Intersection over union</td></tr></thead><tbody><tr><td align="left" valign="top">Term frequency&#x2013;inverse document frequency</td><td align="char" char="." valign="top">0.0738</td><td align="char" char="." valign="top">0.2733</td><td align="char" char="." valign="top">0.0856</td><td align="char" char="." valign="top">0.0685</td></tr><tr><td align="left" valign="top">BERT<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="char" char="." valign="top">0.0155</td><td align="char" char="." valign="top">0.2460</td><td align="char" char="." valign="top">0.0268</td><td align="char" char="." valign="top">0.0142</td></tr><tr><td align="left" valign="top">Fine-tuned BERT</td><td align="char" char="." valign="top">0.2223</td><td align="char" char="." valign="top">0.2233</td><td align="char" char="." valign="top">0.2027</td><td align="char" char="." valign="top">0.1798</td></tr><tr><td align="left" valign="top" colspan="5">No RAG<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mistral-7B</td><td align="char" char="." valign="top">0.0396</td><td align="char" char="." valign="top">0.0316</td><td align="char" char="." valign="top">0.0299</td><td align="char" char="." valign="top">0.0252</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qwen3-14B</td><td align="char" char="." valign="top">0.0482</td><td align="char" char="." valign="top">0.0406</td><td align="char" char="." valign="top">0.0412</td><td align="char" char="." valign="top">0.0394</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Llama3.3-70B</td><td align="char" char="." valign="top">0.0570</td><td align="char" char="." valign="top">0.0511</td><td align="char" char="." valign="top">0.0515</td><td align="char" char="." valign="top">0.0511</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DeepSeek-R1</td><td align="char" char="." valign="top">0.0601</td><td align="char" char="." valign="top">0.0582</td><td align="char" char="." valign="top">0.0588</td><td align="char" char="." valign="top">0.0580</td></tr><tr><td align="left" valign="top" colspan="5">RAG+zero-shot</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mistral-7B</td><td align="char" char="." valign="top">0.0727</td><td align="char" char="." valign="top">0.0706</td><td align="char" char="." valign="top">0.0716</td><td align="char" char="." valign="top">0.0704</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qwen3-14B</td><td align="char" char="." valign="top">0.0992</td><td align="char" char="." valign="top">0.0804</td><td align="char" char="." valign="top">0.0849</td><td align="char" char="." valign="top">0.0800</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Llama3.3-70B</td><td align="char" char="." valign="top">0.1044</td><td align="char" char="." valign="top">0.0906</td><td align="char" char="." valign="top">0.0937</td><td align="char" char="." valign="top">0.0903</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DeepSeek-R1</td><td align="char" char="." valign="top">0.2310</td><td align="char" char="." valign="top">0.2241</td><td align="char" char="." valign="top">0.2160</td><td align="char" char="." valign="top">0.2003</td></tr><tr><td align="left" valign="top" colspan="5">RAG+few-shot</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mistral-7B</td><td align="char" char="." valign="top">0.4657</td><td align="char" char="." valign="top">0.4374</td><td align="char" char="." valign="top">0.4298</td><td align="char" char="." valign="top">0.3914</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qwen3-14B</td><td align="char" char="." valign="top">0.5614</td><td align="char" char="." valign="top">0.5213</td><td align="char" char="." valign="top">0.5253</td><td align="char" char="." valign="top">0.4987</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Llama3.3-70B</td><td align="char" char="." valign="top">0.4819</td><td align="char" char="." valign="top">0.4351</td><td align="char" char="." valign="top">0.4455</td><td align="char" char="." valign="top">0.4245</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DeepSeek-R1</td><td align="char" char="." valign="top"><italic>0.7909</italic></td><td align="char" char="." valign="top"><italic>0.7901</italic></td><td align="char" char="." valign="top"><italic>0.7836</italic></td><td align="char" char="." valign="top"><italic>0.7614</italic></td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>BERT: Bidirectional Encoder Representations from Transformers.</p></fn><fn id="table3fn2"><p><sup>b</sup>RAG: retrieval-augmented generation. </p></fn></table-wrap-foot></table-wrap><p>For nursing interventions (<xref ref-type="table" rid="table4">Table 4</xref>), DeepSeek-R1 again showed the best overall performance, with a precision of 0.8453, a recall of 0.8504, an <italic>F</italic><sub>1</sub>-score of 0.8413, and an IoU of 0.8097. Other traditional methods and language model setups exhibited lower performance, with <italic>F</italic><sub>1</sub>-score varying from 0.0077 (Mistral-7B with no RAG) to 0.5557 (Qwen3-14B with RAG+few-shot) and IoU values ranging from 0.0071 (Mistral-7B with no RAG) to 0.5072 (Qwen3-14B with RAG+few-shot).</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Model performance for mapping nursing interventions.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model and prompting strategies</td><td align="left" valign="bottom">Precision</td><td align="left" valign="bottom">Recall</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="bottom">Intersection over union</td></tr></thead><tbody><tr><td align="left" valign="top">Term frequency&#x2013;inverse document frequency</td><td align="char" char="." valign="top">0.2112</td><td align="char" char="." valign="top">0.5508</td><td align="char" char="." valign="top">0.2323</td><td align="char" char="." valign="top">0.1597</td></tr><tr><td align="left" valign="top">BERT<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="char" char="." valign="top">0.0818</td><td align="char" char="." valign="top">0.3854</td><td align="char" char="." valign="top">0.1200</td><td align="char" char="." valign="top">0.0681</td></tr><tr><td align="left" valign="top">Fine-tuned BERT</td><td align="char" char="." valign="top">0.2297</td><td align="char" char="." valign="top">0.1686</td><td align="char" char="." valign="top">0.1723</td><td align="char" char="." valign="top">0.1290</td></tr><tr><td align="left" valign="top" colspan="5">No RAG<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mistral-7B</td><td align="char" char="." valign="top">0.0079</td><td align="char" char="." valign="top">0.0506</td><td align="char" char="." valign="top">0.0077</td><td align="char" char="." valign="top">0.0071</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qwen3-14B</td><td align="char" char="." valign="top">0.0129</td><td align="char" char="." valign="top">0.0148</td><td align="char" char="." valign="top">0.0132</td><td align="char" char="." valign="top">0.0129</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Llama3.3-70B</td><td align="char" char="." valign="top">0.0142</td><td align="char" char="." valign="top">0.0131</td><td align="char" char="." valign="top">0.0134</td><td align="char" char="." valign="top">0.0130</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DeepSeek-R1</td><td align="char" char="." valign="top">0.0203</td><td align="char" char="." valign="top">0.0182</td><td align="char" char="." valign="top">0.0189</td><td align="char" char="." valign="top">0.0166</td></tr><tr><td align="left" valign="top" colspan="5">RAG+zero-shot</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mistral-7B</td><td align="char" char="." valign="top">0.3885</td><td align="char" char="." valign="top">0.2411</td><td align="char" char="." valign="top">0.2744</td><td align="char" char="." valign="top">0.1907</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qwen3-14B</td><td align="char" char="." valign="top">0.4874</td><td align="char" char="." valign="top">0.4147</td><td align="char" char="." valign="top">0.4298</td><td align="char" char="." valign="top">0.3174</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Llama3.3-70B</td><td align="char" char="." valign="top">0.4074</td><td align="char" char="." valign="top">0.3932</td><td align="char" char="." valign="top">0.3849</td><td align="char" char="." valign="top">0.2782</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DeepSeek-R1</td><td align="char" char="." valign="top">0.4973</td><td align="char" char="." valign="top">0.4903</td><td align="char" char="." valign="top">0.4461</td><td align="char" char="." valign="top">0.3563</td></tr><tr><td align="left" valign="top" colspan="5">RAG+few-shot</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mistral-7B</td><td align="char" char="." valign="top">0.5218</td><td align="char" char="." valign="top">0.4049</td><td align="char" char="." valign="top">0.4299</td><td align="char" char="." valign="top">0.3561</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qwen3-14B</td><td align="char" char="." valign="top">0.6018</td><td align="char" char="." valign="top">0.5458</td><td align="char" char="." valign="top">0.5557</td><td align="char" char="." valign="top">0.5072</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Llama3.3-70B</td><td align="char" char="." valign="top">0.5757</td><td align="char" char="." valign="top">0.4844</td><td align="char" char="." valign="top">0.5052</td><td align="char" char="." valign="top">0.4368</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DeepSeek-R1</td><td align="char" char="." valign="top"><italic>0.8453</italic></td><td align="char" char="." valign="top"><italic>0.8504</italic></td><td align="char" char="." valign="top"><italic>0.8413</italic></td><td align="char" char="." valign="top"><italic>0.8097</italic></td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>BERT: Bidirectional Encoder Representations from Transformers.</p></fn><fn id="table4fn2"><p><sup>b</sup>RAG: retrieval-augmented generation.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Prompting Strategies</title><p>We evaluated the impact of prompting strategies by comparing zero-shot and few-shot setups across all models. Few-shot prompting consistently improved performance for both nursing diagnoses and interventions. For nursing diagnoses (<xref ref-type="fig" rid="figure4">Figure 4</xref>), <italic>F</italic><sub>1</sub>-score across the 4 models ranged from 0.0716 to 0.216 under RAG+zero-shot and increased to a range of 0.4298 to 0.7836 under RAG+few-shot. Corresponding IoU values ranged from 0.0704 to 0.2003 with RAG+zero-shot and from 0.3914 to 0.7614 with RAG+few-shot. For nursing interventions (<xref ref-type="fig" rid="figure5">Figure 5</xref>), <italic>F</italic><sub>1</sub>-score ranged from 0.2744 to 0.4461 with RAG+zero-shot and improved to 0.4299&#x2010;0.8413 with RAG+few-shot. IoU values ranged from 0.1907 to 0.3563 with RAG+zero-shot and from 0.3561 to 0.8097 with RAG+few-shot. In both tasks, DeepSeek-R1 with RAG+few-shot achieved the best performance. Ablation results for the no-RAG+few-shot configuration are provided in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Model performance for nursing diagnosis recognition under different prompting strategies: (left) retrieval-augmented generation (RAG)+zero-shot prompting and (right) RAG+few-shot prompting. This figure shows the performance of different large language models (Mistral-7B, Qwen3-14B, Llama3.3-70B, and DeepSeek-R1) under zero-shot and few-shot prompting conditions in recognizing Clinical Care Classification nursing diagnoses from free-text intensive care unit nursing records. Metrics include precision, recall, <italic>F</italic><sub>1</sub>-score, and intersection over union (IoU).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e89850_fig04.png"/></fig><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Model performance for nursing intervention recognition under different prompting strategies: (left) retrieval-augmented generation (RAG)+zero-shot prompting and (right) RAG+few-shot prompting. This figure shows the performance of different large language models (Mistral-7B, Qwen3-14B, Llama3.3-70B, and DeepSeek-R1) under zero-shot and few-shot prompting conditions in recognizing Clinical Care Classification nursing diagnoses from free-text intensive care unit nursing records. Metrics include precision, recall, <italic>F</italic><sub>1</sub>-score, and intersection over union (IoU).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e89850_fig05.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, we developed CNTRAM, a retrieval-augmented terminology mapping framework integrating dense embedding retrieval, retrieval-enhanced prompting, and few-shot LLM guidance to automatically identify nursing diagnoses and interventions from free-text nursing records based on standardized CCC terminology. Our findings demonstrate that combining RAG with carefully designed few-shot examples markedly improves mapping accuracy compared with TF-IDF, BERT, fine-tuned BERT, and zero-shot LLMs. Specifically, our CNTRAM framework, based on DeepSeek-R1, achieved substantial performance improvements in both nursing diagnosis and intervention mapping. These results align with growing evidence that retrieval grounding improves the factual consistency of clinical text generation models [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>].</p><p>The core challenge addressed by CNTRAM stems from the semantic characteristics inherent in nursing terminology. Nursing diagnoses are typically abstract conceptual constructs requiring inference, demanding that nurses synthesize multiple clues and arrive at diagnoses through reasoning [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Many diagnoses represent higher-order concepts that do not explicitly appear in nursing narratives. In contrast, nursing interventions are more concrete, operationalized, and linguistically salient, typically expressed through explicit action verbs such as &#x201C;monitor,&#x201D; &#x201C;turn,&#x201D; or &#x201C;assess.&#x201D; Previous analyses of CCC semantic structure have also noted that intervention concepts are more operationalized and lexically consistent, while diagnostic concepts may overlap semantically and contain broader conceptual boundaries, complicating automated classification [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. These semantic differences likely explain the higher precision and <italic>F</italic><sub>1</sub>-scores observed in mapping nursing interventions and diagnoses in this study. This also underscores the need for technical approaches that support abstraction and reasoning capabilities during nursing terminology standardization.</p><p>On the basis of the professional attributes of nursing terminology, the performance advantages of the CNTRAM constructed in this study are primarily demonstrated through its 3 components. First, the RAG module retrieves contextually relevant CCC entries for each subquery, providing semantic grounding that reduces ambiguity and stabilizes concept alignment [<xref ref-type="bibr" rid="ref39">39</xref>]. This design is consistent with growing evidence that retrieval augmentation improves reliability in medical question answering and EHR summarization [<xref ref-type="bibr" rid="ref40">40</xref>]. Second, the 2-stage generation structure enforces strict adherence to CCC coding rules while producing stable JSON outputs that support downstream analysis. Finally, few-shot examples offer essential syntactic and semantic anchors for interpreting abstract or compositionally complex nursing expressions such as &#x201C;airway clearance impairment,&#x201D; &#x201C;aspiration risk,&#x201D; &#x201C;infection risk,&#x201D; &#x201C;venous catheter care,&#x201D; and &#x201C;positioning therapy.&#x201D; Evidence from biomedical natural language processing similarly shows that combining retrieval with example-guided prompting markedly improves terminology normalization when annotated data are scarce [<xref ref-type="bibr" rid="ref41">41</xref>].</p><p>Beyond task-level performance, CNTRAM maintains methodological continuity with broader concept normalization research while advancing terminology standardization in nursing. Within medical concept normalization, hybrid approaches that integrate rule-based matching, multilevel semantic similarity, machine learning, or multistage LLM workflows have become increasingly prominent for Unified Medical Language System or Systematized Nomenclature of Medicine&#x2013;Clinical Terms normalization [<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>]. Meanwhile, nursing informatics literature has long emphasized that SNTs enhance interoperability and enable meaningful analysis of nursing patterns [<xref ref-type="bibr" rid="ref45">45</xref>]. Previous cross-mapping studies demonstrated the feasibility of aligning narrative nursing documentation with vocabularies such as NANDA-I and NIC, although manual mapping workflows proved time consuming and inconsistent across institutions [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. By demonstrating that retrieval-enhanced LLMs can adapt effectively to nursing-specific terminology systems and documentation practices, CNTRAM extends these research directions and offers a practical pathway for automated nursing terminology mapping in real-world environments. Additionally, in this study, the use of LLMs with varying parameter scales showed differing recognition performance. Among them, DeepSeek-R1 outperformed the other models, likely due to its stronger reasoning ability, instruction-following capacity, and better adaptation to Chinese clinical text. This reasoning advantage allows it to handle ambiguous or complex medical and nursing expressions more effectively [<xref ref-type="bibr" rid="ref29">29</xref>]. Coupled with reliable instruction-following capacity, this ensures accurate mapping within the constrained output schema [<xref ref-type="bibr" rid="ref48">48</xref>]. Moreover, its specialization in Chinese clinical data further enhances its ability to accurately map nursing terminology, which is essential given the unique linguistic and contextual features of Chinese clinical language [<xref ref-type="bibr" rid="ref49">49</xref>].</p><p>From a nursing practice perspective, CNTRAM offers a scalable method for converting unstructured nursing records into structured, analyzable data. Identifying nursing practice features, such as nursing diagnoses and interventions, within practitioners&#x2019; observation records helps validate the value of SNT for enhancing interoperability and the applicability of nursing data [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. By identifying patients&#x2019; nursing problems and clarifying corresponding nursing actions, CNTRAM can provide a clinically interpretable basis for risk stratification and outcome assessment. Recent observational evidence further supports this direction. Studies from Italian pediatric [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>] and adult oncology settings [<xref ref-type="bibr" rid="ref54">54</xref>] have shown that CCC-based nursing data can capture nursing care complexity and are associated with intrahospital and ICU transfers, diagnosis related group&#x2013;based medical complexity, and length of stay. These findings reinforce the potential of structured nursing data to reflect patient risk and care demand. Accordingly, the CCC-coded information produced by CNTRAM offers a structured foundation that can be incorporated into future analyses of complexity, outcomes, and resource use. In addition, the high IoU score achieved in this study indicates the model&#x2019;s ability to effectively represent comprehensive sets of nursing diagnoses and interventions, reflecting the combinatorial nature of the nursing process. Notably, nursing diagnoses such as risk of infection and risk of aspiration require comprehensive judgment based on multiple clinical conditions and are prone to certain recognition errors [<xref ref-type="bibr" rid="ref55">55</xref>]. Generalized nursing interventions, such as clinical measurements and physical examination, may have mapping biases due to unclear classification granularity [<xref ref-type="bibr" rid="ref56">56</xref>]. Misclassification of nursing diagnoses can affect nurses&#x2019; risk stratification assessment of patients, while misclassification of nursing interventions may disturb the calculation of nursing workload and the correlation between intervention frequency and patient risk [<xref ref-type="bibr" rid="ref57">57</xref>]. In practical application, CNTRAM outputs can serve as an aid for clinical decision support and documentation, but they still require judgment and review by clinical nurses.</p></sec><sec id="s4-2"><title>Limitations and Future Work</title><p>However, this study has several limitations. First, the analysis was based on data from a single ICU with a relatively limited dataset, and the test set covered only a subset of commonly used CCC codes. This partial coverage constrains our ability to generalize the findings to the full CCC terminology system. Second, although few-shot prompting improved model performance, it introduced a dependence on manually curated examples. Such reliance may lead to sampling bias. Third, as highlighted in recent health care RAG literature, robust evaluation frameworks are essential to mitigate issues related to bias, trust, and privacy [<xref ref-type="bibr" rid="ref58">58</xref>]. Future research could further validate the generalization capability of CNTRAM through multicenter and multilingual data verification. Additionally, the flexibility of CNTRAM to adapt to different nursing terminology systems, such as NANDA-I, NIC, and International Classification for Nursing Practice, could be examined. This would involve integrating diverse domain knowledge resources into the RAG framework to enhance semantic granularity and expand the coverage of terminology mapping [<xref ref-type="bibr" rid="ref59">59</xref>]. Furthermore, embedding CNTRAM into EHR systems for real-time semantic standardization could provide actionable support for nursing practice and clinical decision-making.</p></sec><sec id="s4-3"><title>Conclusions</title><p>In this study, we developed CNTRAM, an LLM-based 2-stage RAG framework designed to map free-text nursing records to the CCC terminology. CNTRAM combines dense embedding retrieval and few-shot prompting. Using DeepSeek-R1 as its backbone LLM, this framework outperformed traditional methods, no-RAG models, and zero-shot prompting approaches. The results demonstrate that the integration of RAG, few-shot learning, and LLMs improves mapping accuracy and offers a feasible solution for mapping unstructured nursing data to standardized terminologies.</p></sec></sec></body><back><ack><p>The authors thank Zhang Lei for proofreading the manuscript. During the preparation of this manuscript, the authors used DeepSeek-R1 (DeepSeek) to improve language and readability. After using this tool, the authors reviewed and edited the content as needed and take full responsibility for the content of the published paper.</p></ack><notes><sec><title>Funding</title><p>The authors declare that no financial support was received for this study.</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are not publicly available due to institutional and ethical restrictions but are available from the corresponding author on reasonable request, subject to approval by the relevant institutional ethics committee. The code used in this study is publicly available [<xref ref-type="bibr" rid="ref60">60</xref>].</p><p/></sec></notes><fn-group><fn fn-type="con"><p>ML and DC, as co&#x2013;first authors, contributed equally to this study and were jointly responsible for conceptualization and drafting the original manuscript. QX and ZH contributed to data interpretation and results review. YZ and JZ prepared the figures and tables. YL contributed to writing, review, and editing. HM, as the corresponding author, led study supervision and project administration and critically revised the manuscript. All authors reviewed and approved the final manuscript.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">BAAI</term><def><p>Beijing Academy of Artificial Intelligence</p></def></def-item><def-item><term id="abb2">BERT</term><def><p>Bidirectional Encoder Representations from Transformers</p></def></def-item><def-item><term id="abb3">CCC</term><def><p>Clinical Care Classification</p></def></def-item><def-item><term id="abb4">CNTRAM</term><def><p>Clinical Care Classification nursing terminology with retrieval-augmented mapping</p></def></def-item><def-item><term id="abb5">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb6">ICU</term><def><p>intensive care unit</p></def></def-item><def-item><term id="abb7">IoU</term><def><p>intersection over union</p></def></def-item><def-item><term id="abb8">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb9">NANDA-I</term><def><p>North American Nursing Diagnosis Association International</p></def></def-item><def-item><term id="abb10">NIC</term><def><p>Nursing Interventions Classification</p></def></def-item><def-item><term id="abb11">RAG</term><def><p>retrieval-augmented generation</p></def></def-item><def-item><term id="abb12">SNT</term><def><p>standardized nursing terminology</p></def></def-item><def-item><term id="abb13">TF-IDF</term><def><p>term frequency&#x2013;inverse document frequency</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Opmeer</surname><given-names>BC</given-names> </name></person-group><article-title>Electronic health records as sources of research data</article-title><source>JAMA</source><year>2016</year><month>01</month><day>12</day><volume>315</volume><issue>2</issue><fpage>201</fpage><lpage>202</lpage><pub-id pub-id-type="doi">10.1001/jama.2015.15419</pub-id><pub-id pub-id-type="medline">26757473</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Anderson</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kaul</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gullapalli</surname><given-names>N</given-names> </name><name name-style="western"><surname>Pitani</surname><given-names>S</given-names> </name></person-group><article-title>Electronic health records and clinical documentation in medical residency programs: preparing residents to become master clinicians</article-title><source>J Am Med Inform Assoc</source><year>2023</year><month>11</month><day>17</day><volume>30</volume><issue>12</issue><fpage>1965</fpage><lpage>1972</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocad158</pub-id><pub-id pub-id-type="medline">37573135</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Salanter&#x00E4;</surname><given-names>S</given-names> </name></person-group><article-title>Advanced use of electronic health records: the depth of nursing notes</article-title><source>Nurs Res</source><year>2015</year><volume>64</volume><issue>6</issue><fpage>411</fpage><lpage>412</lpage><pub-id pub-id-type="doi">10.1097/NNR.0000000000000129</pub-id><pub-id pub-id-type="medline">26505153</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>von Gerich</surname><given-names>H</given-names> </name><name name-style="western"><surname>Moen</surname><given-names>H</given-names> </name><name name-style="western"><surname>Peltonen</surname><given-names>LM</given-names> </name></person-group><article-title>Identifying nursing sensitive indicators from electronic health records in acute cardiac care-towards intelligent automated assessment of care quality</article-title><source>J Nurs Manag</source><year>2022</year><month>11</month><volume>30</volume><issue>8</issue><fpage>3726</fpage><lpage>3735</lpage><pub-id pub-id-type="doi">10.1111/jonm.13802</pub-id><pub-id pub-id-type="medline">36124426</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Macieira</surname><given-names>TGR</given-names> </name><name name-style="western"><surname>Chianca</surname><given-names>TCM</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>MB</given-names> </name><etal/></person-group><article-title>Secondary use of standardized nursing care data for advancing nursing science and practice: a systematic review</article-title><source>J Am Med Inform Assoc</source><year>2019</year><month>11</month><day>1</day><volume>26</volume><issue>11</issue><fpage>1401</fpage><lpage>1411</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocz086</pub-id><pub-id pub-id-type="medline">31188439</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Monsen</surname><given-names>KA</given-names> </name><name name-style="western"><surname>Heermann</surname><given-names>L</given-names> </name><name name-style="western"><surname>Dunn-Lopez</surname><given-names>K</given-names> </name></person-group><article-title>FHIR-up! Advancing knowledge from clinical data through application of standardized nursing terminologies within HL7&#x00AE; FHIR&#x00AE;</article-title><source>J Am Med Inform Assoc</source><year>2023</year><month>10</month><day>19</day><volume>30</volume><issue>11</issue><fpage>1858</fpage><lpage>1864</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocad131</pub-id><pub-id pub-id-type="medline">37428893</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Effectiveness of standardized nursing terminologies for nursing practice and healthcare outcomes: a systematic review</article-title><source>Int J Nurs Knowl</source><year>2021</year><month>10</month><volume>32</volume><issue>4</issue><fpage>220</fpage><lpage>228</lpage><pub-id pub-id-type="doi">10.1111/2047-3095.12315</pub-id><pub-id pub-id-type="medline">33580632</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saba</surname><given-names>VK</given-names> </name><name name-style="western"><surname>Taylor</surname><given-names>SL</given-names> </name></person-group><article-title>Moving past theory: use of a standardized, coded nursing terminology to enhance nursing visibility</article-title><source>Comput Inform Nurs</source><year>2007</year><volume>25</volume><issue>6</issue><fpage>324</fpage><lpage>331</lpage><pub-id pub-id-type="doi">10.1097/01.NCN.0000299654.13777.9f</pub-id><pub-id pub-id-type="medline">18000428</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>RC</given-names> </name><name name-style="western"><surname>Tseng</surname><given-names>KJ</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>HF</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>P</given-names> </name></person-group><article-title>A preliminary study on the use of clinical care classification in nursing documentation data sets</article-title><source>Comput Methods Programs Biomed</source><year>2013</year><month>12</month><volume>112</volume><issue>3</issue><fpage>713</fpage><lpage>719</lpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2013.07.019</pub-id><pub-id pub-id-type="medline">24079965</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kang</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Dykes</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Korach</surname><given-names>TZ</given-names> </name><etal/></person-group><article-title>Identifying nurses&#x2019; concern concepts about patient deterioration using a standard nursing terminology</article-title><source>Int J Med Inform</source><year>2020</year><month>01</month><volume>133</volume><fpage>104016</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2019.104016</pub-id><pub-id pub-id-type="medline">31707264</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="web"><article-title>Clinical nursing terminology index</article-title><source>Zhongwei Nursing Information Research Institute</source><access-date>2026-04-15</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://zwini.org.cn/nurseinfo-web/page/nurseterms/index">http://zwini.org.cn/nurseinfo-web/page/nurseterms/index</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>RC</given-names> </name><name name-style="western"><surname>Tseng</surname><given-names>KJ</given-names> </name><name name-style="western"><surname>Yan</surname><given-names>HF</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>HY</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>P</given-names> </name></person-group><article-title>Capability of using clinical care classification system to represent nursing practice in acute setting in Taiwan</article-title><source>NI 2012 (2012)</source><year>2012</year><volume>2012</volume><fpage>113</fpage><pub-id pub-id-type="medline">24199066</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Choi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>Y</given-names> </name></person-group><article-title>Development of a mapping table for nursing notes based on nurses&#x2019; concerns in ICU patients</article-title><source>Stud Health Technol Inform</source><year>2024</year><month>07</month><day>24</day><volume>315</volume><fpage>725</fpage><lpage>726</lpage><pub-id pub-id-type="doi">10.3233/SHTI240299</pub-id><pub-id pub-id-type="medline">39049400</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Torres</surname><given-names>FBG</given-names> </name><name name-style="western"><surname>Gomes</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Hino</surname><given-names>AAF</given-names> </name><name name-style="western"><surname>Moro</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cubas</surname><given-names>MR</given-names> </name></person-group><article-title>Comparison of the results of manual and automated processes of cross-mapping between nursing terms: quantitative study</article-title><source>JMIR Nurs</source><year>2020</year><volume>3</volume><issue>1</issue><fpage>e18501</fpage><pub-id pub-id-type="doi">10.2196/18501</pub-id><pub-id pub-id-type="medline">34345784</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elvas</surname><given-names>LB</given-names> </name><name name-style="western"><surname>Almeida</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ferreira</surname><given-names>JC</given-names> </name></person-group><article-title>Natural language processing in medical text processing: a scoping literature review</article-title><source>Int J Med Inform</source><year>2025</year><month>12</month><volume>204</volume><fpage>106049</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2025.106049</pub-id><pub-id pub-id-type="medline">40706199</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hossain</surname><given-names>E</given-names> </name><name name-style="western"><surname>Rana</surname><given-names>R</given-names> </name><name name-style="western"><surname>Higgins</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Natural language processing in electronic health records in relation to healthcare decision-making: a systematic review</article-title><source>Comput Biol Med</source><year>2023</year><month>03</month><volume>155</volume><fpage>106649</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.106649</pub-id><pub-id pub-id-type="medline">36805219</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Korach</surname><given-names>ZT</given-names> </name><name name-style="western"><surname>Cato</surname><given-names>KD</given-names> </name><name name-style="western"><surname>Collins</surname><given-names>SA</given-names> </name><etal/></person-group><article-title>Unsupervised machine learning of topics documented by nurses about hospitalized patients prior to a rapid-response event</article-title><source>Appl Clin Inform</source><year>2019</year><month>10</month><volume>10</volume><issue>5</issue><fpage>952</fpage><lpage>963</lpage><pub-id pub-id-type="doi">10.1055/s-0039-3401814</pub-id><pub-id pub-id-type="medline">31853936</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Redjdal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Novikava</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kempf</surname><given-names>E</given-names> </name><name name-style="western"><surname>Bouaud</surname><given-names>J</given-names> </name><name name-style="western"><surname>Seroussi</surname><given-names>B</given-names> </name></person-group><article-title>Leveraging rule-based NLP to translate textual reports as structured inputs automatically processed by a clinical decision support system</article-title><source>Stud Health Technol Inform</source><year>2024</year><month>08</month><day>22</day><volume>316</volume><fpage>1861</fpage><lpage>1865</lpage><pub-id pub-id-type="doi">10.3233/SHTI240794</pub-id><pub-id pub-id-type="medline">39176854</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lou</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>K</given-names> </name></person-group><article-title>Dictionary-based matching graph network for biomedical named entity recognition</article-title><source>Sci Rep</source><year>2023</year><month>12</month><day>8</day><volume>13</volume><issue>1</issue><fpage>21667</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-48564-w</pub-id><pub-id pub-id-type="medline">38066007</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nishigaki</surname><given-names>D</given-names> </name><name name-style="western"><surname>Suzuki</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wataya</surname><given-names>T</given-names> </name><etal/></person-group><article-title>BERT-based transfer learning in sentence-level anatomic classification of free-text radiology reports</article-title><source>Radiol Artif Intell</source><year>2023</year><volume>5</volume><issue>2</issue><fpage>e220097</fpage><pub-id pub-id-type="doi">10.1148/ryai.220097</pub-id><pub-id pub-id-type="medline">37035437</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xiao</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>F</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>X</given-names> </name><etal/></person-group><article-title>A comprehensive survey of large language models and multimodal large language models in medicine</article-title><source>Inf Fusion</source><year>2025</year><month>05</month><volume>117</volume><issue>C</issue><fpage>102888</fpage><pub-id pub-id-type="doi">10.1016/j.inffus.2024.102888</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ke</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>L</given-names> </name><name name-style="western"><surname>Elangovan</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Retrieval augmented generation for 10 large language models and its generalizability in assessing medical fitness</article-title><source>NPJ Digit Med</source><year>2025</year><month>04</month><day>5</day><volume>8</volume><issue>1</issue><fpage>187</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01519-z</pub-id><pub-id pub-id-type="medline">40185842</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hong</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>F</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>H</given-names> </name></person-group><article-title>Evaluation of the integration of retrieval-augmented generation in large language model for breast cancer nursing care responses</article-title><source>Sci Rep</source><year>2024</year><month>12</month><day>28</day><volume>14</volume><issue>1</issue><fpage>30794</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-81052-3</pub-id><pub-id pub-id-type="medline">39730573</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="web"><article-title>JSON Output</article-title><source>DeepSeek API Docs</source><access-date>2026-04-15</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://api-docs.deepseek.com/guides/json_mode">https://api-docs.deepseek.com/guides/json_mode</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Bafna</surname><given-names>P</given-names> </name><name name-style="western"><surname>Pramod</surname><given-names>D</given-names> </name><name name-style="western"><surname>Vaidya</surname><given-names>A</given-names> </name></person-group><article-title>Document clustering: TF-IDF approach</article-title><conf-name>2016 International Conference on Electrical, Electronics, and Optimization Techniques (ICEEOT)</conf-name><conf-date>Mar 3-5, 2016</conf-date><pub-id pub-id-type="doi">10.1109/ICEEOT.2016.7754750</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Grattafiori</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dubey</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jauhri</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pandey</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kadian</surname><given-names>A</given-names> </name><name name-style="western"><surname>Al-Dahle</surname><given-names>A</given-names> </name><etal/></person-group><article-title>The Llama 3 herd of models</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 31, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2407.21783</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>A</given-names> </name><name name-style="western"><surname>Li</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>B</given-names> </name><name name-style="western"><surname>Hui</surname><given-names>B</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Qwen3 technical report</article-title><source>arXiv</source><comment>Preprint posted online on  May 14, 2025</comment><pub-id pub-id-type="doi">10.48550/arXiv.2505.09388</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Jiang</surname><given-names>AQ</given-names> </name><name name-style="western"><surname>Sablayrolles</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mensch</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bamford</surname><given-names>C</given-names> </name><name name-style="western"><surname>Chaplot</surname><given-names>DS</given-names> </name></person-group><article-title>Mistral 7B</article-title><source>arXiv</source><comment>Preprint posted online on  Oct 10, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2310.06825</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><etal/></person-group><article-title>DeepSeek-R1 incentivizes reasoning in LLMs through reinforcement learning</article-title><source>Nature</source><year>2025</year><month>09</month><volume>645</volume><issue>8081</issue><fpage>633</fpage><lpage>638</lpage><pub-id pub-id-type="doi">10.1038/s41586-025-09422-z</pub-id><pub-id pub-id-type="medline">40962978</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Levy</surname><given-names>O</given-names> </name><name name-style="western"><surname>Seo</surname><given-names>M</given-names> </name><name name-style="western"><surname>Choi</surname><given-names>E</given-names> </name><name name-style="western"><surname>Zettlemoyer</surname><given-names>L</given-names> </name></person-group><article-title>Zero-shot relation extraction via reading comprehension</article-title><conf-name>Proceedings of the 21st Conference on Computational Natural Language Learning (CoNLL 2017)</conf-name><conf-date>Aug 3-4, 2017</conf-date><pub-id pub-id-type="doi">10.18653/v1/K17-1034</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Parnami</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>M</given-names> </name></person-group><article-title>Learning from few examples: a summary of approaches to few-shot learning</article-title><source>ArXiv</source><comment>Preprint posted online on  Mar 7, 2022</comment><pub-id pub-id-type="doi">10.48550/arXiv.2203.04291</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhan</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Benchmarking retrieval-augmented large language models in biomedical NLP: application, robustness, and self-awareness</article-title><source>Sci Adv</source><year>2025</year><month>11</month><day>21</day><volume>11</volume><issue>47</issue><fpage>eadr1443</fpage><pub-id pub-id-type="doi">10.1126/sciadv.adr1443</pub-id><pub-id pub-id-type="medline">41270181</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Koga</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ono</surname><given-names>D</given-names> </name><name name-style="western"><surname>Obstfeld</surname><given-names>A</given-names> </name></person-group><article-title>Retrieval-augmented generation versus document-grounded generation: a key distinction in large language models</article-title><source>J Pathol Clin Res</source><year>2025</year><month>01</month><volume>11</volume><issue>1</issue><fpage>e70014</fpage><pub-id pub-id-type="doi">10.1002/2056-4538.70014</pub-id><pub-id pub-id-type="medline">39817433</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alkhalaf</surname><given-names>M</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>P</given-names> </name><name name-style="western"><surname>Yin</surname><given-names>M</given-names> </name><name name-style="western"><surname>Deng</surname><given-names>C</given-names> </name></person-group><article-title>Applying generative AI with retrieval augmented generation to summarize and extract key clinical information from electronic health records</article-title><source>J Biomed Inform</source><year>2024</year><month>08</month><volume>156</volume><fpage>104662</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2024.104662</pub-id><pub-id pub-id-type="medline">38880236</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pirret</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Neville</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>La Grow</surname><given-names>SJ</given-names> </name></person-group><article-title>Nurse practitioners versus doctors diagnostic reasoning in a complex case presentation to an acute tertiary hospital: a comparative study</article-title><source>Int J Nurs Stud</source><year>2015</year><month>03</month><volume>52</volume><issue>3</issue><fpage>716</fpage><lpage>726</lpage><pub-id pub-id-type="doi">10.1016/j.ijnurstu.2014.08.009</pub-id><pub-id pub-id-type="medline">25234268</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Smith</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Benbenek</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Bakker</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Bockwoldt</surname><given-names>D</given-names> </name></person-group><article-title>Scoping review: diagnostic reasoning as a component of clinical reasoning in the U.S. primary care nurse practitioner education</article-title><source>J Adv Nurs</source><year>2022</year><month>12</month><volume>78</volume><issue>12</issue><fpage>3869</fpage><lpage>3896</lpage><pub-id pub-id-type="doi">10.1111/jan.15414</pub-id><pub-id pub-id-type="medline">35986584</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fine</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chaudhri</surname><given-names>A</given-names> </name><name name-style="western"><surname>Englebright</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dan Roberts</surname><given-names>W</given-names> </name></person-group><article-title>Nursing process, derived from the clinical care classification system components, as an earlier indicator of nursing care during a pandemic</article-title><source>Int J Med Inform</source><year>2023</year><month>05</month><volume>173</volume><fpage>104954</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2022.104954</pub-id><pub-id pub-id-type="medline">36842361</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jansen</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Coenen</surname><given-names>A</given-names> </name><name name-style="western"><surname>Saba</surname><given-names>V</given-names> </name><name name-style="western"><surname>Hardiker</surname><given-names>N</given-names> </name></person-group><article-title>Harmonising nursing terminologies using a conceptual framework</article-title><source>Stud Health Technol Inform</source><year>2016</year><volume>225</volume><fpage>471</fpage><lpage>475</lpage><pub-id pub-id-type="medline">27332245</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Zhong</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Honda</surname><given-names>N</given-names> </name></person-group><article-title>Deep learning based dense retrieval: a comparative study</article-title><source>ArXiv</source><comment>Preprint posted online on  Oct 27, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2410.20315</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>S</given-names> </name><name name-style="western"><surname>McCoy</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>A</given-names> </name></person-group><article-title>Improving large language model applications in biomedicine with retrieval-augmented generation: a systematic review, meta-analysis, and clinical development guidelines</article-title><source>J Am Med Inform Assoc</source><year>2025</year><month>04</month><day>1</day><volume>32</volume><issue>4</issue><fpage>605</fpage><lpage>615</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocaf008</pub-id><pub-id pub-id-type="medline">39812777</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kresevic</surname><given-names>S</given-names> </name><name name-style="western"><surname>Giuffr&#x00E8;</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ajcevic</surname><given-names>M</given-names> </name><name name-style="western"><surname>Accardo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Croc&#x00E8;</surname><given-names>LS</given-names> </name><name name-style="western"><surname>Shung</surname><given-names>DL</given-names> </name></person-group><article-title>Optimization of hepatological clinical guidelines interpretation by large language models: a retrieval augmented generation-based framework</article-title><source>NPJ Digit Med</source><year>2024</year><month>04</month><day>23</day><volume>7</volume><issue>1</issue><fpage>102</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01091-y</pub-id><pub-id pub-id-type="medline">38654102</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>L</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Clinical concept normalization with a hybrid natural language processing system combining multilevel matching and machine learning ranking</article-title><source>J Am Med Inform Assoc</source><year>2020</year><month>10</month><day>1</day><volume>27</volume><issue>10</issue><fpage>1576</fpage><lpage>1584</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocaa155</pub-id><pub-id pub-id-type="medline">33029642</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yoon</surname><given-names>D</given-names> </name><name name-style="western"><surname>Han</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>DW</given-names> </name><etal/></person-group><article-title>Redefining health care data interoperability: empirical exploration of large language models in information exchange</article-title><source>J Med Internet Res</source><year>2024</year><month>05</month><day>31</day><volume>26</volume><fpage>e56614</fpage><pub-id pub-id-type="doi">10.2196/56614</pub-id><pub-id pub-id-type="medline">38819879</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Afshar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>D</given-names> </name><name name-style="western"><surname>Croxford</surname><given-names>E</given-names> </name><name name-style="western"><surname>Demner-Fushman</surname><given-names>D</given-names> </name></person-group><article-title>On the role of the UMLS in supporting diagnosis generation proposed by large language models</article-title><source>J Biomed Inform</source><year>2024</year><month>09</month><volume>157</volume><fpage>104707</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2024.104707</pub-id><pub-id pub-id-type="medline">39142598</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dunn Lopez</surname><given-names>K</given-names> </name><name name-style="western"><surname>Heermann Langford</surname><given-names>L</given-names> </name><name name-style="western"><surname>Kennedy</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Future advancement of health care through standardized nursing terminologies: reflections from a Friends of the National Library of Medicine workshop honoring Virginia K. Saba</article-title><source>J Am Med Inform Assoc</source><year>2023</year><month>10</month><day>19</day><volume>30</volume><issue>11</issue><fpage>1878</fpage><lpage>1884</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocad156</pub-id><pub-id pub-id-type="medline">37553233</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>D&#x2019;Agostino</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zeffiro</surname><given-names>V</given-names> </name><name name-style="western"><surname>Vellone</surname><given-names>E</given-names> </name><etal/></person-group><article-title>Cross-mapping of nursing care terms recorded in Italian hospitals into the standardized NNN terminology</article-title><source>Int J Nurs Knowl</source><year>2020</year><month>01</month><volume>31</volume><issue>1</issue><fpage>4</fpage><lpage>13</lpage><pub-id pub-id-type="doi">10.1111/2047-3095.12200</pub-id><pub-id pub-id-type="medline">29328554</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Juv&#x00E9; Udina</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Gonzalez Samartino</surname><given-names>M</given-names> </name><name name-style="western"><surname>Matud Calvo</surname><given-names>C</given-names> </name></person-group><article-title>Mapping the diagnosis axis of an interface terminology to the NANDA international taxonomy</article-title><source>ISRN Nurs</source><year>2012</year><volume>2012</volume><fpage>676905</fpage><pub-id pub-id-type="doi">10.5402/2012/676905</pub-id><pub-id pub-id-type="medline">22830046</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liao</surname><given-names>B</given-names> </name><name name-style="western"><surname>Qi</surname><given-names>J</given-names> </name><name name-style="western"><surname>Eustratiadis</surname><given-names>P</given-names> </name><name name-style="western"><surname>Monz</surname><given-names>C</given-names> </name><name name-style="western"><surname>Bisazza</surname><given-names>A</given-names> </name><etal/></person-group><article-title>The SIFo benchmark: investigating the sequential instruction following ability of large language models</article-title><conf-name>Findings of the Association for Computational Linguistics: EMNLP 2024</conf-name><conf-date>Nov 12-16, 2024</conf-date><pub-id pub-id-type="doi">10.18653/v1/2024.findings-emnlp.92</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yao</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Duan</surname><given-names>L</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chi</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sheng</surname><given-names>D</given-names> </name></person-group><article-title>Performance of large language models in the non-English context: qualitative study of models trained on different languages in Chinese medical examinations</article-title><source>JMIR Med Inform</source><year>2025</year><month>06</month><day>27</day><volume>13</volume><fpage>e69485</fpage><pub-id pub-id-type="doi">10.2196/69485</pub-id><pub-id pub-id-type="medline">40577654</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jedwab</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Holzhauser</surname><given-names>K</given-names> </name><name name-style="western"><surname>Raghunathan</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Applicability and benefits of standardised nursing terminology in Australia: a scoping review</article-title><source>Collegian</source><year>2024</year><month>12</month><volume>31</volume><issue>6</issue><fpage>404</fpage><lpage>420</lpage><pub-id pub-id-type="doi">10.1016/j.colegn.2024.10.001</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ranegger</surname><given-names>R</given-names> </name><name name-style="western"><surname>Baumberger</surname><given-names>D</given-names> </name><name name-style="western"><surname>Grgic</surname><given-names>P</given-names> </name><name name-style="western"><surname>Jagfeld</surname><given-names>G</given-names> </name></person-group><article-title>Semantic interoperability of nursing data - mapping an interface terminology to SNOMED CT</article-title><source>Stud Health Technol Inform</source><year>2024</year><month>08</month><day>22</day><volume>316</volume><fpage>1297</fpage><lpage>1301</lpage><pub-id pub-id-type="doi">10.3233/SHTI240650</pub-id><pub-id pub-id-type="medline">39176619</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cesare</surname><given-names>M</given-names> </name><name name-style="western"><surname>D&#x2019;Agostino</surname><given-names>F</given-names> </name><name name-style="western"><surname>Sebastiani</surname><given-names>E</given-names> </name><collab>Nursing And Public Health Group</collab><name name-style="western"><surname>Damiani</surname><given-names>G</given-names> </name><name name-style="western"><surname>Cocchieri</surname><given-names>A</given-names> </name></person-group><article-title>Deciphering the link between diagnosis-related group weight and nursing care complexity in hospitalized children: an observational study</article-title><source>Children (Basel)</source><year>2025</year><month>01</month><day>17</day><volume>12</volume><issue>1</issue><fpage>103</fpage><pub-id pub-id-type="doi">10.3390/children12010103</pub-id><pub-id pub-id-type="medline">39857934</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cesare</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cocchieri</surname><given-names>A</given-names> </name></person-group><article-title>Can an increase in nursing care complexity raise the risk of intra-hospital and intensive care unit transfers in children? A retrospective observational study</article-title><source>J Pediatr Nurs</source><year>2025</year><volume>80</volume><fpage>91</fpage><lpage>99</lpage><pub-id pub-id-type="doi">10.1016/j.pedn.2024.11.015</pub-id><pub-id pub-id-type="medline">39602875</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cesare</surname><given-names>M</given-names> </name><name name-style="western"><surname>Magliozzi</surname><given-names>E</given-names> </name><name name-style="western"><surname>D&#x2019;Agostino</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zeffiro</surname><given-names>V</given-names> </name><name name-style="western"><surname>Cocchieri</surname><given-names>A</given-names> </name></person-group><article-title>Prevalence and accuracy of nursing diagnoses in patients with malignant bronchial and lung cancer: a retrospective observational study</article-title><source>Eur J Oncol Nurs</source><year>2025</year><month>08</month><volume>77</volume><fpage>102931</fpage><pub-id pub-id-type="doi">10.1016/j.ejon.2025.102931</pub-id><pub-id pub-id-type="medline">40712222</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hasegawa</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ogasawara</surname><given-names>C</given-names> </name><name name-style="western"><surname>Katz</surname><given-names>EC</given-names> </name></person-group><article-title>Measuring diagnostic competency and the analysis of factors influencing competency using written case studies</article-title><source>Int J Nurs Terminol Classif</source><year>2007</year><volume>18</volume><issue>3</issue><fpage>93</fpage><lpage>102</lpage><pub-id pub-id-type="doi">10.1111/j.1744-618X.2007.00057.x</pub-id><pub-id pub-id-type="medline">17714237</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Coenen</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ryan</surname><given-names>P</given-names> </name><name name-style="western"><surname>Sutton</surname><given-names>J</given-names> </name></person-group><article-title>Mapping nursing interventions from a hospital information system to the Nursing Interventions Classification (NIC)</article-title><source>Nurs Diagn</source><year>1997</year><volume>8</volume><issue>4</issue><fpage>145</fpage><lpage>151</lpage><pub-id pub-id-type="doi">10.1111/j.1744-618x.1997.tb00469.x</pub-id><pub-id pub-id-type="medline">9624992</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>M&#x00FC;ller-Staub</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lavin</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Needham</surname><given-names>I</given-names> </name><name name-style="western"><surname>van Achterberg</surname><given-names>T</given-names> </name></person-group><article-title>Nursing diagnoses, interventions and outcomes - application and impact on nursing practice: systematic review</article-title><source>J Adv Nurs</source><year>2006</year><month>12</month><volume>56</volume><issue>5</issue><fpage>514</fpage><lpage>531</lpage><pub-id pub-id-type="doi">10.1111/j.1365-2648.2006.04012.x</pub-id><pub-id pub-id-type="medline">17078827</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Amugongo</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Mascheroni</surname><given-names>P</given-names> </name><name name-style="western"><surname>Brooks</surname><given-names>S</given-names> </name><name name-style="western"><surname>Doering</surname><given-names>S</given-names> </name><name name-style="western"><surname>Seidel</surname><given-names>J</given-names> </name></person-group><article-title>Retrieval augmented generation for large language models in healthcare: a systematic review</article-title><source>PLOS Digit Health</source><year>2025</year><month>06</month><volume>4</volume><issue>6</issue><fpage>e0000877</fpage><pub-id pub-id-type="doi">10.1371/journal.pdig.0000877</pub-id><pub-id pub-id-type="medline">40498738</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>SY</given-names> </name><name name-style="western"><surname>Miao</surname><given-names>C</given-names> </name></person-group><article-title>MedRAG: enhancing retrieval-augmented generation with knowledge graph-elicited reasoning for healthcare copilot</article-title><conf-name>WWW &#x2019;25: Proceedings of the ACM on Web Conference 2025</conf-name><conf-date>Apr 28 to May 2, 2025</conf-date><pub-id pub-id-type="doi">10.1145/3696410.3714782</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="web"><source>GitHub</source><access-date>2026-04-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/miye-ha/CNTRAM">https://github.com/miye-ha/CNTRAM</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Supplementary terms.</p><media xlink:href="jmir_v28i1e89850_app1.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Recall@k Values for Different Retrieval Window k</p><media xlink:href="jmir_v28i1e89850_app2.docx" xlink:title="DOCX File, 16 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Performance of large language models under &#x201C;No retrieval-augmented generation&#x201D; and &#x201C;Few-shot prompting&#x201D; for nursing diagnosis and intervention tasks.</p><media xlink:href="jmir_v28i1e89850_app3.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material></app-group></back></article>