<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v27i1e74177</article-id><article-id pub-id-type="doi">10.2196/74177</article-id><article-categories><subj-group subj-group-type="heading"><subject>Review</subject></subj-group></article-categories><title-group><article-title>Large Language Models in Lung Cancer: Systematic Review</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Zhong</surname><given-names>Ruikang</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chen</surname><given-names>Siyi</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Zexing</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gao</surname><given-names>Tangke</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Su</surname><given-names>Yisha</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Wenzheng</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Dianna</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Gao</surname><given-names>Lei</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Hu</surname><given-names>Kaiwen</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib></contrib-group><aff id="aff1"><institution>Graduate School, Beijing University of Chinese Medicine</institution><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff2"><institution>Oncology Department, Dongfang Hospital, Beijing University of Chinese Medicine</institution><addr-line>No. 6, Fangxingyuan 1st District, Fengtai District</addr-line><addr-line>Beijing</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Wu</surname><given-names>Chaochen</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Vedaraju</surname><given-names>Yuvanesh</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Yueniwati</surname><given-names>Yuyun</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Kaiwen Hu, MD, Oncology Department, Dongfang Hospital, Beijing University of Chinese Medicine, No. 6, Fangxingyuan 1st District, Fengtai District, Beijing, China, 86 13911650713; <email>kaiwenh@163.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>30</day><month>9</month><year>2025</year></pub-date><volume>27</volume><elocation-id>e74177</elocation-id><history><date date-type="received"><day>19</day><month>03</month><year>2025</year></date><date date-type="rev-recd"><day>13</day><month>08</month><year>2025</year></date><date date-type="accepted"><day>14</day><month>08</month><year>2025</year></date></history><copyright-statement>&#x00A9;Ruikang Zhong, Siyi Chen, Zexing Li, Tangke Gao, Yisha Su, Wenzheng Zhang, Dianna Liu, Lei Gao, Kaiwen Hu. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 30.9.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e74177"/><abstract><sec><title>Background</title><p>In the era of data and intelligence, artificial intelligence has been widely applied in the medical field. As the most cutting-edge technology, the large language model (LLM) has gained popularity due to its extraordinary ability to handle complex tasks and interactive features.</p></sec><sec><title>Objective</title><p>This study aimed to systematically review current applications of LLMs in lung cancer (LC) care and evaluate their potential across the full-cycle management spectrum.</p></sec><sec sec-type="methods"><title>Methods</title><p>Following PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines, we conducted a comprehensive literature search across 6 databases up to January 1, 2025. Studies were included if they satisfied the following criteria: (1) journal articles, conference papers, and preprints; (2) studies that reported the content of LLMs in LC; (3) including original data and LC-related data presented separately; and (4) studies published in English. The exclusion criteria were as follows: (1) books and book chapters, letters, reviews, conference proceedings; (2) studies that did not report the content of LLMs in LC; and (3) no original data, and LC-related data that are not presented separately. Studies were screened independently by 2 authors (SC and ZL) and assessed for quality using Quality Assessment of Diagnostic Accuracy Studies-2, Prediction Model Risk of Bias Assessment Tool, and Risk Of Bias in Non-randomized Studies - of Interventions tools, selected based on study type. Key data items extracted included model type, application scenario, prompt method, input and output format, outcome measures, and safety considerations. Data analysis was conducted using descriptive statistics.</p></sec><sec sec-type="results"><title>Results</title><p>Out of 706 studies screened, 28 were included (published between 2023 and 2024). The ability of LLMs to automatically extract medical records, popularize general knowledge about LC, and assist clinical diagnosis and treatment has been demonstrated through the systematic review, emerging visual ability, and multimodal potential. Prompt engineering was a critical component, with varying degrees of sophistication from zero-shot to fine-tuned approaches. Quality assessments revealed overall acceptable methodological rigor but noted limitations in bias control and data security reporting.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>LLMs show considerable potential in improving LC diagnosis, communication, and decision-making. However, their responsible use requires attention to privacy, interpretability, and human oversight.</p></sec><sec><title>Trial Registration</title><p>PROSPERO CRD42024612388; https://www.crd.york.ac.uk/PROSPERO/view/CRD42024612388</p></sec></abstract><kwd-group><kwd>lung cancer</kwd><kwd>LC</kwd><kwd>large language modeling</kwd><kwd>LLM</kwd><kwd>artificial intelligence</kwd><kwd>full-cycle management</kwd><kwd>clinical practice</kwd><kwd>systematic review</kwd><kwd>diagnosis</kwd><kwd>treatment</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Lung cancer (LC) is one of the leading causes of cancer incidence and mortality worldwide [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Early detection and accurate treatment are essential to improving survival [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>], and low-dose computed tomography (CT) screening has been shown to reduce mortality [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. In recent years, integrated full-cycle management&#x2014;covering prevention, screening, diagnosis, treatment, and supportive care&#x2014;has been promoted to improve both survival and quality of life [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. However, this approach requires complex workflows and large-scale data processing, placing heavy demands on medical resources and personnel.</p><p>Artificial intelligence, particularly large language models (LLMs), offers a potential solution. LLMs can process complex clinical data, support decision-making, and enable personalized communication between patients and health care providers [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. At the same time, they face limitations such as bias [<xref ref-type="bibr" rid="ref12">12</xref>] and hallucinations [<xref ref-type="bibr" rid="ref13">13</xref>]. These issues highlight the need for a systematic evaluation of their role in clinical practice.</p><p>Numerous studies have been conducted on LLMs in the field of LC. Some scholars have carried out a systematic review on the potential of LLMs and natural language processing in LC diagnosis [<xref ref-type="bibr" rid="ref14">14</xref>]. However, it was limited to diagnostic applications, relied on outdated evidence, and lacked a comprehensive scope. This study aims to address these gaps by systematically reviewing the latest applications of LLMs in LC. We summarize current use cases, model types, fine-tuning strategies, limitations, and future directions. Our goal is to help clinicians and researchers better understand how to integrate LLMs into LC management while recognizing their potential and constraints.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>This study was conducted in accordance with the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) guidelines [<xref ref-type="bibr" rid="ref15">15</xref>]. The PRISMA checklist is presented in <xref ref-type="supplementary-material" rid="app2">Checklist 1</xref>.</p></sec><sec id="s2-2"><title>Eligibility Criteria</title><p>We established clear inclusion and exclusion criteria based on the research objectives, as summarized in <xref ref-type="table" rid="table1">Table 1</xref>. No time restrictions were applied during the selection of studies.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Inclusion and exclusion criteria.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Criterion</td><td align="left" valign="bottom">Inclusion</td><td align="left" valign="bottom">Exclusion</td></tr></thead><tbody><tr><td align="left" valign="top">Types of studies</td><td align="left" valign="top">Journal articles, conference papers, and preprints</td><td align="left" valign="top">Books and book chapters, letters, reviews, and conference proceedings</td></tr><tr><td align="left" valign="top">Content</td><td align="left" valign="top">Content involves LLMs<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> and LC<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">Neither LLMs nor LC</td></tr><tr><td align="left" valign="top">Outcomes</td><td align="left" valign="top">Including original data, and LC-related data are presented separately</td><td align="left" valign="top">No original data, and LC-related data are not presented separately</td></tr><tr><td align="left" valign="top">Language</td><td align="left" valign="top">English</td><td align="left" valign="top">Non-English</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>LLM: large language model.</p></fn><fn id="table1fn2"><p><sup>b</sup>LC: lung cancer.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-3"><title>Data Sources</title><p>Eligible studies were identified by searching 6 electronic databases: PubMed, Web of Science, IEEE, Embase, Cochrane Library, and Scopus. The final search was run up to January 1, 2025.</p></sec><sec id="s2-4"><title>Search Strategy</title><p>The search strategy was structured as follows: ((&#x201C;large language model&#x201D;) OR (&#x201C;LLM&#x201D;) OR (&#x201C;ChatGPT&#x201D;) OR (&#x201C;chatGPT&#x201D;)) AND ((&#x201C;lung cancer&#x201D;) OR (&#x201C;lung tumor&#x201D;) OR (&#x201C;pulmonary ground-glass&#x201D;) OR (&#x201C;lung malignancy&#x201D;) OR (&#x201C;lung carcinoma&#x201D;) OR (&#x201C;lung metastasis&#x201D;) OR (&#x201C;lung metastatic&#x201D;) OR (&#x201C;pulmonary metastatic&#x201D;) OR (&#x201C;pulmonary metastasis&#x201D;)).</p></sec><sec id="s2-5"><title>Selection Process</title><p>EndNote X9.3.3 (build 13966; Clarivate) was used to manage references and remove duplicates. Two authors (RZ and SC) independently screened the titles and abstracts, followed by full-text screening based on the predefined inclusion and exclusion criteria. Discrepancies were resolved through discussion, with arbitration by a third author (ZL) when necessary. The consistency degree of the 2 authors was verified using the kappa consistency test.</p></sec><sec id="s2-6"><title>Data Collection Process</title><p>Two authors (RZ and SC) carried out the data collection process. All extracted data from the main text, tables, figures, and appendices were annotated using WPS Office Excel (version 12.1.0.18608; Kingsoft Office Software).</p></sec><sec id="s2-7"><title>Data Items</title><p>The data extraction form included the following items: title, first author, year of publication, study design, LLM model used, application scenario, intervention, prompt engineering approach, input and output formats, and outcome measures. The consistency rate of the 2 authors was calculated.</p></sec><sec id="s2-8"><title>Quality Appraisal</title><p>To ensure a rigorous evaluation of study quality, we adopted a mixed methods approach based on the framework by Omar and Levkovich [<xref ref-type="bibr" rid="ref16">16</xref>]. Appropriate quality assessment tools were selected based on the specific application of LLMs in each study. QUADAS-2 (Quality Assessment of Diagnostic Accuracy Studies-2) [<xref ref-type="bibr" rid="ref17">17</xref>] is a validated and widely accepted tool for evaluating the quality of diagnostic tests. For studies where LLMs were primarily applied to LC diagnosis or staging, the QUADAS-2 tool was used. PROBAST (Prediction Model Risk of Bias Assessment Tool) [<xref ref-type="bibr" rid="ref18">18</xref>] is specifically designed to assess the risk of bias in studies involving predictive modeling and was applied accordingly. The ROBINS-I (Risk Of Bias in Non-randomized Studies - of Interventions) [<xref ref-type="bibr" rid="ref19">19</xref>] tool is commonly used to assess bias in observational studies. For research on information extraction and knowledge-based tasks, these were considered observational in nature, and thus, the ROBINS-I tool was applied. Given that studies involving LLMs differ in format and content from conventional clinical trials, 2 oncology experts at the chief physician level (LG and KH) adapted the criteria of each tool accordingly to better reflect the nature and objectives of the included studies.</p><p>The quality assessment was carried out back-to-back by 2 researchers (SC and ZL) and, in the case of controversial content, by a third researcher (RZ) in order to deliberate jointly on the decision. The final results are reviewed by 2 experts (LG and KH). The consistency degree of the 2 authors was verified using the kappa consistency test.</p></sec><sec id="s2-9"><title>Synthesis Methods</title><p>Meta-analysis was not planned in this review. We conducted data analysis using descriptive statistics. Frequencies were used to summarize the application scenarios, prompt strategies, and other relevant characteristics of LLMs. Narrative synthesis was conducted due to the heterogeneity in the specified aims and methodologies across the included studies. We primarily used WPS and the BioRender website for figure generation. We used IBM SPSS (version 29.0.2.0) to calculate the kappa value.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Search Results</title><p>In this study, a total of 706 studies were retrieved, and 28 studies [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref47">47</xref>] were finally included after screening. The kappa values of the 2 researchers during the screening stage were 0.87, indicating good consistency. The specific screening process is presented in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Study flowchart (produced according to the PRISMA [Preferred Reporting Items for Systematic Reviews and Meta-Analyses] 2020 flow diagram).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e74177_fig01.png"/></fig></sec><sec id="s3-2"><title>Basic Information of Included Sources</title><p>During the data extraction stage, the consistency rate of the 2 authors reached 0.97. All included studies were published between 2023 and 2024, with 7 published in 2023 [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref40">40</xref>] and 21 in 2024 [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref47">47</xref>]. Of these, 13 studies originated from the United States [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>], followed by 3 each from South Korea [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref44">44</xref>], Germany [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>], and China [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. The remaining studies were conducted in India [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref47">47</xref>], Turkey [<xref ref-type="bibr" rid="ref28">28</xref>], Japan [<xref ref-type="bibr" rid="ref37">37</xref>], Greece [<xref ref-type="bibr" rid="ref40">40</xref>], and the Netherlands [<xref ref-type="bibr" rid="ref41">41</xref>]. Publication types included 5 conference papers [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref47">47</xref>] and 4 preprints [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. The most commonly used LC type was non&#x2013;small cell lung cancer (NSCLC). Most studies focused on knowledge-based question answering, information extraction, and diagnostic support. The LLMs used varied widely, with frequent use of OpenAI&#x2019;s GPT-3.5, GPT-4, and GPT-4V, Meta AI&#x2019;s LLaMA-2, and Google AI&#x2019;s Bard. A summary of these details is provided in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Summary of included sources.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Study</td><td align="left" valign="bottom">Title</td><td align="left" valign="bottom">Country</td><td align="left" valign="bottom">Device</td><td align="left" valign="bottom">Best performance</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Information extraction</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Bhattarai et al [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">Leveraging GPT-4 for identifying cancer phenotypes in electronic health records: a performance comparison between GPT-4, GPT-3.5-turbo, Flan-T5, Llama-3-8B, and spaCy&#x2019;s rule-based and machine learning&#x2013;based methods</td><td align="left" valign="top">United States</td><td align="left" valign="top">GPT-4, GPT-3.5-turbo, Flan-T5, Llama-3-8B, spaCy</td><td align="left" valign="top">GPT-4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Fink et al [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">Potential of ChatGPT and GPT-4 for data mining of free-text CT<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> reports on lung cancer</td><td align="left" valign="top">Germany</td><td align="left" valign="top">ChatGPT, GPT-4</td><td align="left" valign="top">GPT-4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hu et al [<xref ref-type="bibr" rid="ref22">22</xref>]</td><td align="left" valign="top">Zero-shot information extraction from radiological reports using ChatGPT</td><td align="left" valign="top">China</td><td align="left" valign="top">ChatGPT</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Naik et al [<xref ref-type="bibr" rid="ref23">23</xref>]</td><td align="left" valign="top">Applying large language models for causal structure learning in non&#x2013;small cell lung cancer</td><td align="left" valign="top">United States</td><td align="left" valign="top">NR<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Niu et al [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">Cross-institutional structured radiology reporting for lung cancer screening using a dynamic template-constrained large language model</td><td align="left" valign="top">United States</td><td align="left" valign="top">Llama-3.1 (8B, 70B, 405B), Qwen-2 (72B), Mistral-Large (123B)</td><td align="left" valign="top">Llama-3.1 (8B, 70B, 405B)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lee et al [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">SEETrials: leveraging large language models for safety and efficacy extraction in oncology clinical trials</td><td align="left" valign="top">United States</td><td align="left" valign="top">GPT-4</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lyu et al [<xref ref-type="bibr" rid="ref26">26</xref>]</td><td align="left" valign="top">Translating radiology reports into plain language using ChatGPT and GPT-4 with prompt learning: results, limitations, and potential</td><td align="left" valign="top">United States</td><td align="left" valign="top">ChatGPT</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="5">Knowledge-based question and answer evaluation</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ferrari-Light et al [<xref ref-type="bibr" rid="ref27">27</xref>]</td><td align="left" valign="top">Evaluating ChatGPT as a patient resource for frequently asked questions about lung cancer surgery&#x2013;a pilot study</td><td align="left" valign="top">United States</td><td align="left" valign="top">GPT-3.5</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gencer [<xref ref-type="bibr" rid="ref28">28</xref>]</td><td align="left" valign="top">Readability analysis of ChatGPT&#x2019;s responses on lung cancer</td><td align="left" valign="top">Turkey</td><td align="left" valign="top">GPT-3.5-turbo</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Haver et al [<xref ref-type="bibr" rid="ref29">29</xref>]</td><td align="left" valign="top">Use of ChatGPT, GPT-4, and Bard to improve readability of ChatGPT&#x2019;s answers to common questions about lung cancer and lung cancer screening</td><td align="left" valign="top">United States</td><td align="left" valign="top">ChatGPT, GPT 4, Bard</td><td align="left" valign="top">Bard</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Janopaul-Naylor et al [<xref ref-type="bibr" rid="ref30">30</xref>]</td><td align="left" valign="top">Physician assessment of ChatGPT and Bing answers to American Cancer Society&#x2019;s questions to ask about your cancer</td><td align="left" valign="top">United States</td><td align="left" valign="top">GPT-3.5, Bing AI</td><td align="left" valign="top">GPT-3.5</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rogasch et al [<xref ref-type="bibr" rid="ref31">31</xref>]</td><td align="left" valign="top">ChatGPT: can you prepare my patients for [18F]FDG PET/CT and explain my reports?</td><td align="left" valign="top">Germany</td><td align="left" valign="top">ChatGPT</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rahsepar et al [<xref ref-type="bibr" rid="ref32">32</xref>]</td><td align="left" valign="top">How AI responds to common lung cancer questions: ChatGPT versus Google Bard</td><td align="left" valign="top">United States</td><td align="left" valign="top">GPT-3.5, Google Bard experimental version</td><td align="left" valign="top">GPT-3.5</td></tr><tr><td align="left" valign="top" colspan="5">Auxiliary diagnosis</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cho et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td><td align="left" valign="top">Extracting lung cancer staging descriptors from pathology reports: a generative language model approach</td><td align="left" valign="top">Korea</td><td align="left" valign="top">Llama-2-7B, Mistral-7B, Deductive Llama-2-7B (Orca-2), Deductive Mistral-7B (Dolphin), AWS Llama-2-70B, AWS Titan express</td><td align="left" valign="top">Deductive Mistral-7B</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dehdab et al [<xref ref-type="bibr" rid="ref34">34</xref>]</td><td align="left" valign="top">Evaluating ChatGPT-4V in chest CT diagnostics: a critical image interpretation assessment</td><td align="left" valign="top">Germany</td><td align="left" valign="top">GPT-4V</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hu et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td><td align="left" valign="top">The power of combining data and knowledge: GPT-4o is an effective interpreter of machine learning models in predicting lymph node metastasis of lung cancer</td><td align="left" valign="top">China</td><td align="left" valign="top">GPT-4</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Huang et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td><td align="left" valign="top">A critical assessment of using ChatGPT for extracting structured data from clinical notes</td><td align="left" valign="top">United States</td><td align="left" valign="top">GPT-3.5-Turbo-16k</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yasaka et al [<xref ref-type="bibr" rid="ref37">37</xref>]</td><td align="left" valign="top">Fine-tuned large language model for extracting patients on pretreatment for lung cancer from a picture archiving and communication system based on radiological reports</td><td align="left" valign="top">Japan</td><td align="left" valign="top">Transformers Japanese model</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Vallabhaneni et al [<xref ref-type="bibr" rid="ref38">38</xref>]</td><td align="left" valign="top">Improved lung cancer detection through use of large language systems with graphical attributes</td><td align="left" valign="top">India</td><td align="left" valign="top">NR</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qu et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td><td align="left" valign="top">The rise of AI language pathologists: exploring two-level prompt learning for few-shot weakly-supervised whole slide image classification</td><td align="left" valign="top">China</td><td align="left" valign="top">GPT-4</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">Panagoulias</named-content> et al [<xref ref-type="bibr" rid="ref40">40</xref>]</td><td align="left" valign="top">Evaluation of ChatGPT-supported diagnosis, staging and treatment planning for the case of lung cancer</td><td align="left" valign="top">Greece</td><td align="left" valign="top">ChatGPT</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mithun et al [<xref ref-type="bibr" rid="ref41">41</xref>]</td><td align="left" valign="top">Transfer learning with BERT and ClinicalBERT models for multiclass classification of radiology imaging reports</td><td align="left" valign="top">Netherlands</td><td align="left" valign="top">BERT, ClinicalBERT</td><td align="left" valign="top">ClinicalBERT</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lee et al [<xref ref-type="bibr" rid="ref42">42</xref>]</td><td align="left" valign="top">Lung cancer staging using chest CT and FDG PET/CT free-text reports: comparison among three ChatGPT large-language models and six human readers of varying experience</td><td align="left" valign="top">Korea</td><td align="left" valign="top">GPT-4o, GPT-4, GPT-3.5</td><td align="left" valign="top">GPT-4o</td></tr><tr><td align="left" valign="top" colspan="5">Treatment decision-making</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dong et al [<xref ref-type="bibr" rid="ref43">43</xref>]</td><td align="left" valign="top">Large-language-model empowered 3D dose prediction for intensity-modulated radiotherapy</td><td align="left" valign="top">United States</td><td align="left" valign="top">Llama-2</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Jeong et al [<xref ref-type="bibr" rid="ref44">44</xref>]</td><td align="left" valign="top">The prediction of stress in radiation therapy: integrating artificial intelligence with biological signals</td><td align="left" valign="top">Korea</td><td align="left" valign="top">Decision tree, random forest, support vector machine, LSTM<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>, GPT-4, GPT-3.5</td><td align="left" valign="top">LSTM (limited information); GPT-4 (complex and diverse information)</td></tr><tr><td align="left" valign="top" colspan="5">Aided nursing</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dos Santos et al [<xref ref-type="bibr" rid="ref45">45</xref>]</td><td align="left" valign="top">An example of leveraging AI for documentation: ChatGPT-generated nursing care plan for an older adult with lung cancer</td><td align="left" valign="top">United States</td><td align="left" valign="top">ChatGPT</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="5">Scientific research</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Wang et al [<xref ref-type="bibr" rid="ref46">46</xref>]</td><td align="left" valign="top">Scientific figures interpreted by ChatGPT: strengths in plot recognition and limits in color perception</td><td align="left" valign="top">United States</td><td align="left" valign="top">GPT-4V</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Devi et al [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Automating clinical trial eligibility screening: quantitative analysis of GPT models versus human expertise</td><td align="left" valign="top">India</td><td align="left" valign="top">GPT-3.5-turbo</td><td align="left" valign="top">&#x2014;</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>CT: computed tomography.</p></fn><fn id="table2fn2"><p><sup>b</sup>Not available.</p></fn><fn id="table2fn3"><p><sup>c</sup>NR: not reported.</p></fn><fn id="table2fn4"><p><sup>d</sup>LSTM: long short-term memory.</p></fn></table-wrap-foot></table-wrap><p>Notably, many studies used multiple LLMs or conducted comparative evaluations, and some explored multimodal capabilities such as image interpretation. The best-performing models identified in these comparative studies are summarized in <xref ref-type="table" rid="table2">Table 2</xref>. The results indicate that the ChatGPT (OpenAI) series models are the most comprehensive and widely applicable, exhibiting strong performance in both information extraction and auxiliary diagnosis, highlighting the improvements achieved through version updates. However, for a limited number of tasks or under constrained information conditions, lightweight models, such as Bard or architectures like long short-term memory networks may perform better. In addition, LLMs specialized in the medical domain, such as Deductive Mistral-7B and ClinicalBERT, demonstrate superior performance compared with general-purpose pretrained models.</p></sec><sec id="s3-3"><title>Prompt Engineering and Model Training</title><p>Prompt engineering plays a critical role in the development and application of LLMs and is a frequent topic of discussion in related studies. Therefore, we synthesized and summarized the prompt engineering strategies, model inputs and outputs, and evaluation metrics used in the included studies (<xref ref-type="table" rid="table3">Table 3</xref>). In total, 12 (43%) studies [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref47">47</xref>] did not explicitly describe their prompting strategies, which were generally basic queries, primarily intended for educational use. Furthermore, 16 (57%) studies [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] clearly described their prompting methods. These methods included prompt templates, instructional prompts, zero-shot or few-shot learning, and other fine-tuning techniques. Regarding the types of training data, a total of 22 (79%) studies [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] focused on text, 3 (11%) studies [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref43">43</xref>] on images, and 3 (11%) studies [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] on a combination of images and text. Outcome metrics commonly included confusion matrices, rating scales, and comparisons against gold-standard references or expert consensus. Some studies also reported on the time efficiency and cost-effectiveness of LLM-generated outputs.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Prompt engineering and model training.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Study</td><td align="left" valign="bottom">Prompt method or content</td><td align="left" valign="bottom">Model input</td><td align="left" valign="bottom">Model output</td><td align="left" valign="bottom">Outcome indicators</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Information extraction</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Bhattarai et al [<xref ref-type="bibr" rid="ref20">20</xref>]</td><td align="left" valign="top">Zero-shot prompt</td><td align="left" valign="top">Segmented text and zero-shot prompt</td><td align="left" valign="top">Phenotypic information (cancer staging, cancer treatment), evidence of cancer recurrence, and organs affected by cancer recurrence</td><td align="left" valign="top">Accuracy, recall rate, <italic>F</italic><sub>1</sub>-score, generation time, operating costs</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Fink et al [<xref ref-type="bibr" rid="ref21">21</xref>]</td><td align="left" valign="top">25 original lung cancer CT<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> reports used to prompt training</td><td align="left" valign="top">Original lung cancer CT reports</td><td align="left" valign="top">Tumor information includes tumor lesions, metastatic sites, tumor impression assessment (deterioration, stability, improvement), and interpretation</td><td align="left" valign="top">McNemar test, accuracy, 5-point Likert scale</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hu et al [<xref ref-type="bibr" rid="ref22">22</xref>]</td><td align="left" valign="top">Prompt template, including an information extraction command, a question form, extraction requirements, and some relevant medical knowledge</td><td align="left" valign="top">CT reports and prompt template</td><td align="left" valign="top">Answers to the question form</td><td align="left" valign="top">Accuracy, precision, recall rate, and <italic>F</italic><sub>1</sub>-score</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Naik et al [<xref ref-type="bibr" rid="ref23">23</xref>]</td><td align="left" valign="top">Code interpreter plugin (developed by OpenAI)</td><td align="left" valign="top">Electronic medical records, genomic data</td><td align="left" valign="top">Directed acyclic graph</td><td align="left" valign="top">Bdeu score</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Niu et al [<xref ref-type="bibr" rid="ref24">24</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">CT imaging</td><td align="left" valign="top">Standardized and structured radiological reports</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score, CI, McNemar test, and <italic>z</italic> test</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lee et al [<xref ref-type="bibr" rid="ref25">25</xref>]</td><td align="left" valign="top">Prompt templates</td><td align="left" valign="top">Journal abstract</td><td align="left" valign="top">Details of clinical trials in the article</td><td align="left" valign="top">Accuracy, recall rate, <italic>F</italic><sub>1</sub>-score</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lyu et al [<xref ref-type="bibr" rid="ref26">26</xref>]</td><td align="left" valign="top">Instruction</td><td align="left" valign="top">Radiological reports</td><td align="left" valign="top">Report translation and suggestions</td><td align="left" valign="top">Self score, report completeness and accuracy</td></tr><tr><td align="left" valign="top" colspan="5">Knowledge-based question and answer evaluation</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Ferrari-Light et al [<xref ref-type="bibr" rid="ref27">27</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Questions</td><td align="left" valign="top">Answers</td><td align="left" valign="top">5-point Likert scale</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gencer [<xref ref-type="bibr" rid="ref28">28</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Questions</td><td align="left" valign="top">Answers</td><td align="left" valign="top">Flesch Reading Ease (FRE) formula, Flesch-Kincaid Grade level (FKGL), Gunning FOG formula, SMOG index, Automated readability index (ARI), Coleman-Liau index, Linsear write formula, Dale-Chall readability score, Spache readability formula</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Haver et al [<xref ref-type="bibr" rid="ref29">29</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Questions</td><td align="left" valign="top">Baseline responses and simplified responses</td><td align="left" valign="top">Reading Ease Score, readability, clinical appropriateness</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Janopaul-Naylor et al [<xref ref-type="bibr" rid="ref30">30</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Questions</td><td align="left" valign="top">Answers</td><td align="left" valign="top">Self rating</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rogasch et al [<xref ref-type="bibr" rid="ref31">31</xref>]</td><td align="left" valign="top">Regeneration-response function repeated three times for training</td><td align="left" valign="top">Questions</td><td align="left" valign="top">Answers</td><td align="left" valign="top">Self rating</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rahsepar et al [<xref ref-type="bibr" rid="ref32">32</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Questions</td><td align="left" valign="top">Answers</td><td align="left" valign="top">Accuracy, consistency</td></tr><tr><td align="left" valign="top" colspan="5">Auxiliary diagnosis</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cho et al [<xref ref-type="bibr" rid="ref33">33</xref>]</td><td align="left" valign="top">Morphology group</td><td align="left" valign="top">Segmented pathological report</td><td align="left" valign="top">42 lung cancer staging descriptors; tumor node classification</td><td align="left" valign="top">Macro <italic>F</italic><sub>1</sub>-score, accurate matching ratio, accuracy</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dehdab et al [<xref ref-type="bibr" rid="ref34">34</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">CT images of lung window</td><td align="left" valign="top">Diagnosis of lung cancer (yes or no)</td><td align="left" valign="top">Accuracy, sensitivity, specificity</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hu et al [<xref ref-type="bibr" rid="ref35">35</xref>]</td><td align="left" valign="top">Prompt templates, including roles, tasks, patient data, machine learning model results and instructions</td><td align="left" valign="top">Prompt templates</td><td align="left" valign="top">Prediction results of lymph node metastasis in lung cancer</td><td align="left" valign="top">AUC<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>, AP (average precision of 3 repetitions)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Huang et al [<xref ref-type="bibr" rid="ref36">36</xref>]</td><td align="left" valign="top">Prompt templates, including clinical staging introduction and instructions</td><td align="left" valign="top">Pathology reports and prompt templates</td><td align="left" valign="top">Tumor size, tumor characteristics, lymph node involvement, histological classification, clinical staging</td><td align="left" valign="top">Accuracy, average precision, <italic>F</italic><sub>1</sub>-score, Kappa, recall rate</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yasaka et al [<xref ref-type="bibr" rid="ref37">37</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Clinical indications and diagnosis of radiological reports</td><td align="left" valign="top">Patient grouping (Group 0: no lung cancer, Group 1: lung cancer pre-treatment present, Group 2: after lung cancer treatment, Group 3: planned radiotherapy)</td><td align="left" valign="top">Overall accuracy, sensitivity, consistency, AUC, classification time</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Vallabhaneni et al [<xref ref-type="bibr" rid="ref38">38</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Images, symptoms, clinical prescriptions</td><td align="left" valign="top">Diagnosis of lung cancer (yes or no)</td><td align="left" valign="top">Accuracy, recall rate, <italic>F</italic><sub>1</sub>-score, AUC</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Qu et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td><td align="left" valign="top">Guide GPT-4 to visually describe complex medical concepts</td><td align="left" valign="top">Questions (text)</td><td align="left" valign="top">Answers</td><td align="left" valign="top">AUC</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Panagoulias et al [<xref ref-type="bibr" rid="ref40">40</xref>]</td><td align="left" valign="top">Build and refine prompts based on the returned answers</td><td align="left" valign="top">Symptom description</td><td align="left" valign="top">Diagnosis and treatment plan for lung cancer</td><td align="left" valign="top">Self-drafted standards</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mithun et al [<xref ref-type="bibr" rid="ref41">41</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Radiological reports</td><td align="left" valign="top">Classification results of lung cancer</td><td align="left" valign="top">AUC, <italic>F</italic><sub>1</sub>-score, accuracy, recall rate, precision</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lee et al [<xref ref-type="bibr" rid="ref42">42</xref>]</td><td align="left" valign="top">Instruction</td><td align="left" valign="top">Chest CT and FDG PET<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup> or CT reports</td><td align="left" valign="top">The maximum size of the primary tumor, local invasion, satellite lesions, metastatic lymph nodes, intrathoracic and extrathoracic metastases, and TNM<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup> staging diagnosis</td><td align="left" valign="top">Accuracy, recall rate, <italic>F</italic><sub>1</sub>-score, average task completion time, misreading rate</td></tr><tr><td align="left" valign="top" colspan="5">Treatment decision-making</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dong et al [<xref ref-type="bibr" rid="ref43">43</xref>]</td><td align="left" valign="top">Clinical physician commands (findings, treatment goals, and precautions)</td><td align="left" valign="top">CT images</td><td align="left" valign="top">DVH (Radiation dose volume histogram)</td><td align="left" valign="top">Mean absolute error (MAE) of Dmax, Dmean, D95, and D1 between actual and predicted plans</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Jeong et al [<xref ref-type="bibr" rid="ref44">44</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Biological signals before radiotherapy and instructions</td><td align="left" valign="top">Prediction results of biological signals and stress response during radiotherapy</td><td align="left" valign="top">Accuracy, recall rate, precision, <italic>F</italic><sub>1</sub>-score</td></tr><tr><td align="left" valign="top" colspan="5">Aided nursing</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dos Santos et al [<xref ref-type="bibr" rid="ref45">45</xref>]</td><td align="left" valign="top">Patient&#x2019;s needs framework (Situation or Background, Physical, Safety, Psychosocial, Spiritual or Culture, Nursing Recommendation)</td><td align="left" valign="top">Medical records, needs framework, problem prompts</td><td align="left" valign="top">Care plan</td><td align="left" valign="top">The number of items that match the gold standard (16 tags including NANDA, NOC, and NIC)</td></tr><tr><td align="left" valign="top" colspan="5">Scientific research</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Wang et al [<xref ref-type="bibr" rid="ref46">46</xref>]</td><td align="left" valign="top">Instruction</td><td align="left" valign="top">K-M<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup> curves generated based on gene expression data and survival information</td><td align="left" valign="top">Analysis and Interpretation of K-M curves</td><td align="left" valign="top">Overall accuracy, Accuracy under each category</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Devi et al [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">Not mentioned</td><td align="left" valign="top">Unprocessed raw dataset</td><td align="left" valign="top">Whether the patient is qualified for enrollment (yes or no)</td><td align="left" valign="top">Accuracy compared with manual classification</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>CT: computed tomography.</p></fn><fn id="table3fn2"><p><sup>b</sup>AUC: area under the curve.</p></fn><fn id="table3fn3"><p><sup>c</sup>FDG PET: Fluorodeoxyglucose positron emission tomography.</p></fn><fn id="table3fn4"><p><sup>d</sup>TNM: tumor, nodes, metastasis.</p></fn><fn id="table3fn5"><p><sup>e</sup>K-M: Kaplan Meier.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Quality Appraisal</title><p>The included studies were categorized based on their research objectives, and quality was assessed using corresponding appraisal tools (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The kappa values of the 2 researchers were 0.84. Furthermore, 3 predictive modeling studies [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>] were evaluated using the PROBAST tool (<xref ref-type="fig" rid="figure2">Figure 2A</xref>). These studies showed low risk of bias regarding data sources, populations, and methodologies but exhibited a potentially high risk in predictor and outcome domains. In total, 10 diagnostic studies [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref47">47</xref>] were assessed using QUADAS-2 (<xref ref-type="fig" rid="figure2">Figure 2B</xref>). While most demonstrated good applicability, the overall risk of bias remained unclear. Furthermore, 16 intervention studies [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>] were appraised using the ROBINS-I tool (<xref ref-type="fig" rid="figure2">Figure 2C</xref>), showing low risk of bias in participant selection and intervention assignment, but unclear or high risk in other domains. Among them, 29% (18/63) of conference papers and preprints have a high-risk or unclear bias risk, while 26% (34/133) of journal papers have a high risk or unclear bias risk.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>(A) The quality appraisal for 3 predictive studies with PROBAST (Prediction model Risk Of Bias Assessment Tool). (B) The quality appraisal for 9 diagnostic studies with QUADAS-2 (Quality Assessment of Diagnostic Accuracy Studies-2). (C) The quality appraisal for 16 intervention trials with ROBINS-I (Risk Of Bias In Non-randomized Studies - of Interventions).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e74177_fig02.png"/></fig></sec><sec id="s3-5"><title>Other Aspects</title><p>In addition, we examined whether the included studies reported human oversight, addressed safety considerations, and acknowledged limitations. In total, 26 (93%) studies [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref47">47</xref>] reported human involvement in system design, operation, or evaluation. Only 6 (21%) studies [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>] explicitly addressed issues related to information security or data privacy. Furthermore, 20 (71%) studies [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>] clearly stated their limitations.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Through a systematic review of 28 studies [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref47">47</xref>], we identified 7 primary application domains of LLMs in LC: auxiliary diagnosis, information extraction, question answering, scientific research, medical education, nursing support, and treatment decision-making (<xref ref-type="fig" rid="figure3">Figure 3</xref>). These domains often overlap in real-world practice&#x2014;for instance, information extraction frequently supports diagnostic processes, while question-answering is commonly applied in science communication and patient education (<xref ref-type="table" rid="table2">Table 2</xref>).</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Applications of large language models in lung cancer. LLM: large language model.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e74177_fig03.png"/></fig></sec><sec id="s4-2"><title>Applications of LLMs in LC</title><p>LLMs can extract clinical features by applying natural language processing methods. Therefore, many studies have used LLMs to extract and analyze information from electronic medical records [<xref ref-type="bibr" rid="ref48">48</xref>], CT reports [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], and pathological reports [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] related to LC. This not only enables the diagnosis of clinical staging, histological type, lung-RADS (Reporting and Data System) score, and metastasis sites of LC, but also leverages their reasoning ability for diagnosis and prediction, such as lymph node metastasis [<xref ref-type="bibr" rid="ref35">35</xref>] and malignancy degree of lung nodules [<xref ref-type="bibr" rid="ref49">49</xref>]. This highlights the potential of LLMs in LC diagnosis, especially for early screening. Early diagnosis of LC can effectively improve survival rates [<xref ref-type="bibr" rid="ref50">50</xref>], and mass LC screening achieves a high detection rate of early-stage LC [<xref ref-type="bibr" rid="ref51">51</xref>], but it is time-consuming and labor-intensive. Ding et al [<xref ref-type="bibr" rid="ref52">52</xref>] applied ChatGPT to automatically generate medical records during lung nodule screening sessions and integrated it into a WeChat (Tencent Holdings Limited) applet to streamline the consultation process. Singh et al [<xref ref-type="bibr" rid="ref53">53</xref>] applied ChatGPT and Gemini (Google AI) to generate lung-RADS scores based on low-dose CT reports for LC screening, achieving up to 83.6% accuracy. A systematic review of LLMs in gastroenterology [<xref ref-type="bibr" rid="ref54">54</xref>] similarly demonstrated the potential applications of LLMs in gastrointestinal endoscopy and the screening of precancerous lesions. Although LLMs still face challenges, such as insufficient extraction performance for complex tasks and hallucinations [<xref ref-type="bibr" rid="ref55">55</xref>], the results of the study by Jong et al [<xref ref-type="bibr" rid="ref42">42</xref>] also indicate that using LLMs in place of medical professionals for LC staging is not currently supported. However, with ongoing updates to training data and continuous upgrading and optimization of LLMs, we remain optimistic about their future performance in assisting with LC diagnosis and early screening.</p><p>Given the interactive nature and vast data reserves of LLMs, many studies have evaluated their application in knowledge question answering [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]. They have been widely applied in disseminating general knowledge about LC. With the refinement and diversification of training data and the development of multimodal large models, LLMs have shown improved capabilities in processing visual information [<xref ref-type="bibr" rid="ref56">56</xref>]. Under carefully designed prompts and instructions, several studies have found that LLMs can perform preliminary analyses of medical images and textual data and, within controlled research settings, offer diagnostic and therapeutic suggestions for LC. Examples include providing initial recommendations for subsequent treatment options in newly diagnosed or suspected patients with NSCLC [<xref ref-type="bibr" rid="ref57">57</xref>], generating more detailed chemotherapy [<xref ref-type="bibr" rid="ref58">58</xref>] or radiotherapy [<xref ref-type="bibr" rid="ref59">59</xref>] plans, and predicting outcome indicators such as overall survival [<xref ref-type="bibr" rid="ref60">60</xref>] and radiotherapy-induced stress responses [<xref ref-type="bibr" rid="ref44">44</xref>], thereby assisting treatment and nursing decision-making in research contexts [<xref ref-type="bibr" rid="ref45">45</xref>]. Furthermore, LLMs pretrained on multilingual corpora have demonstrated potential in transcribing or translating LC radiology reports [<xref ref-type="bibr" rid="ref61">61</xref>] and surgical records [<xref ref-type="bibr" rid="ref62">62</xref>] to support multicenter clinical research. It should be noted, however, that most existing evidence is derived from retrospective analyses or small-sample, single-center studies. Robust prospective, multicenter clinical validation remains lacking, and systematic assessments of model interpretability, bias, and safety are still insufficient. Therefore, the reliability and generalizability of these methods in routine clinical practice require further confirmation.</p><p>The natural language processing and named entity recognition capabilities of LLMs can not only benefit clinicians and patients in clinical practice but also improve researchers&#x2019; efficiency. Devi et al [<xref ref-type="bibr" rid="ref47">47</xref>] used GPT-3.5-turbo to classify patients with NSCLC based on pathological reports to determine their eligibility for clinical trials, assisting researchers with eligibility screening. Kyeryoung et al [<xref ref-type="bibr" rid="ref25">25</xref>] used GPT-4 to extract safety and efficacy information from clinical trial abstracts and convert it into computable data for comparative analysis across large clinical trial datasets. Liu et al [<xref ref-type="bibr" rid="ref63">63</xref>] used LLaMA 3.1 (Meta AI) to generate clinical trial annotations, enabling oncologists to stay fully updated with the latest oncology data presented at medical conferences and in journal publications. Similarly, Yuan et al [<xref ref-type="bibr" rid="ref64">64</xref>] constructed and evaluated 3 machine learning models for predicting LC survival using an LLM-based advanced data analysis approach, making advanced analytics accessible to nontechnical health care professionals.</p><p>From the above, it is evident that the current applications of LLMs in LC span multiple stages of care, from early screening and diagnosis to treatment planning, patient follow-up, and research support. However, their maturity, evidence base, and clinical readiness vary substantially. Diagnostic and screening tools are the most developed, yet most rely on retrospective datasets and single-center studies, with limited prospective, multicenter clinical validation. Similarly, treatment planning applications show promise in integrating patient-specific data with clinical guidelines, but they also lack large-scale, prospective evaluations to confirm safety, effectiveness, and adaptability to evolving oncology standards. Patient follow-up and supportive care applications are even less developed, despite their potential to improve adherence, symptom management, and long-term quality of life. These stages are often complex due to diverse patient needs, variable follow-up schedules, and sensitive data management requirements, which may explain their slower technological adoption. Research-support tools, such as automated trial eligibility screening or survival prediction, demonstrate potential for improving efficiency, but their accuracy and reproducibility in real-world practice remain uncertain.</p><p>Based on these observations, we identify 3 research priorities. First, rigorous prospective, multicenter clinical validation of both diagnostic or screening and treatment planning applications to ensure generalizability and safety. Second, targeted development of patient follow-up and supportive care applications to address gaps in long-term management and patient engagement. Third, improvement of model interpretability, bias mitigation, and integration strategies to enable safe deployment across diverse health care systems. Addressing these gaps will be essential for the effective integration of LLMs into full-cycle LC management.</p></sec><sec id="s4-3"><title>Limitations of LLMs and Future Directions in LC</title><p>Clinical decision-making for LC in practice is driven by multimodal data, including clinical notes, radiological images, and pathological features. This implies that artificial intelligence tools capable of effectively integrating multimodal data hold significant potential for advancing clinical treatment of LC [<xref ref-type="bibr" rid="ref65">65</xref>]. However, the research reviewed in this article still primarily focuses on text processing. Although efforts have been made to explore other data modalities, including CT images [<xref ref-type="bibr" rid="ref34">34</xref>], pathological images [<xref ref-type="bibr" rid="ref39">39</xref>], and bioinformatics data [<xref ref-type="bibr" rid="ref46">46</xref>], the accuracy of their outputs has yet to match that of text-based outputs. Furthermore, studies indicate that deep learning models specialized in image processing, such as Convolutional Neural Networks, outperform LLMs in classifying LC cytology images [<xref ref-type="bibr" rid="ref66">66</xref>]. Therefore, researchers tend to combine LLMs with other deep learning models for multimodal data analysis [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. Nevertheless, the development and advancement of multimodal LLMs remain a key trend. Currently, OpenAI has taken the lead by launching ChatGPT-4o and ChatGPT-4V, spearheading the application boom of multimodal LLMs. In the future, LLMs are expected to overcome single-modality limitations on a large scale and enhance accurate diagnosis and treatment of LC by integrating multimodal reasoning capabilities across medical images, genomic data, biological molecular information, and even audio and video.</p><p>Existing research on LC predominantly uses general LLMs, such as ChatGPT and LLAMA-2, which are trained on public databases and experience slow knowledge base updates. These models may have gaps in domain-specific LC knowledge, and their outputs are prone to hallucinations and insufficient citations [<xref ref-type="bibr" rid="ref67">67</xref>]. In recent years, many large models targeting specific tasks within clinical specialties have also emerged. For example, Med-PaLM 2 [<xref ref-type="bibr" rid="ref68">68</xref>], which excels at lengthy medical question-answering; BioBERT [<xref ref-type="bibr" rid="ref69">69</xref>], which specializes in biomedical texts; and ClinicalBERT [<xref ref-type="bibr" rid="ref70">70</xref>], which focuses on clinical texts. However, studies have found that their performance on cardiac surgery knowledge quizzes [<xref ref-type="bibr" rid="ref71">71</xref>] and precision LC treatment plans [<xref ref-type="bibr" rid="ref72">72</xref>] is inferior to that of general LLMs with larger training parameter counts. Retrieval-augmented generation (RAG), a cutting-edge technology in large models, can reference reliable external knowledge (REK) to generate answers or content, enable real-time knowledge updates, and offer strong interpretability and customization capabilities [<xref ref-type="bibr" rid="ref73">73</xref>]. Combining this technology with general large-scale models has resulted in more satisfactory outcomes. Built on Google&#x2019;s Gemini Pro LLM, MEREDITH uses RAG and chain-of-thought reasoning. MEREDITH was enhanced to incorporate clinical studies on drug response within specific tumor types, trial databases, drug approval status, and oncologic guidelines. The precise treatment recommendations it provides for tumors closely align with expert advice [<xref ref-type="bibr" rid="ref74">74</xref>]. Tozuka et al [<xref ref-type="bibr" rid="ref75">75</xref>] summarized the current LC staging guidelines in Japan and supplied these as REK to NotebookLM, a RAG-equipped LLM. NotebookLM achieved 86% diagnostic accuracy in LC staging experiments, outperforming GPT-4o, which recorded 39% accuracy with REK and 25% without. In addition, appropriate prompt engineering can enhance the performance of general-purpose LLMs on specific tasks. Most of the studies included in our review used directives, prompt templates, and fine-tuning. Prompt templates often incorporated role descriptions, case examples, task requirements, LC-specific knowledge, and formatting instructions. Fine-tuning involves retraining a pretrained LLM (eg, ChatGPT and BERT) using labeled data for a specific task or domain to improve its performance on domain-specific tasks [<xref ref-type="bibr" rid="ref76">76</xref>]. A study by Arzideh et al [<xref ref-type="bibr" rid="ref77">77</xref>], comparing the extraction of clinical entities from unstructured medical records of patients with LC, found that a fine-tuned BERT model using annotated data achieved a higher <italic>F</italic><sub>1</sub>-score than an instruction-based LLM. Similarly, Zhu et al [<xref ref-type="bibr" rid="ref78">78</xref>] developed an open-source, oncology-specific LLM using a stacked alignment and fine-tuning process, which outperformed ChatGPT on medical benchmarks and achieved an area under the receiver operating characteristic curve of 0.95 for LC detection.</p><p>The studies included in this paper all used open-source LLMs; however, when deploying open-source LLMs in the cloud, issues related to data security and privacy protection are inevitable. Only 6 studies[20,31,33,38,42,43] have explicitly proposed specific data security measures, including legal constraints, such as the Health Insurance Portability and Accountability Act (HIPAA) [<xref ref-type="bibr" rid="ref20">20</xref>] or standard protocols [<xref ref-type="bibr" rid="ref38">38</xref>], data access restrictions [<xref ref-type="bibr" rid="ref33">33</xref>], and data anonymization [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. With the widespread adoption of LLMs in medical settings and growing awareness of data security, hospitals with significant application demands opt to deploy open-source LLMs locally, enabling models and data to operate entirely within the hospital intranet and thereby avoiding risks associated with cloud transmission [<xref ref-type="bibr" rid="ref79">79</xref>]. They also mitigate data leakage risks through methods such as data anonymization and deidentification [<xref ref-type="bibr" rid="ref80">80</xref>], federated learning [<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref82">82</xref>], and differential privacy [<xref ref-type="bibr" rid="ref83">83</xref>], among others. In the future, continued technological advancements and regulatory improvements, strengthened data supervision mechanisms, and a balanced approach between cost and performance will be essential to protect patient privacy.</p><p>At the same time, it should be acknowledged that LLMs cannot fully replace medical professionals, and it is necessary to clarify the responsibility attribution of LLMs in real clinical scenarios. Ethical frameworks should be established based on the needs of different medical scenarios and acceptable thresholds for patients and applied in a targeted manner [<xref ref-type="bibr" rid="ref84">84</xref>]. Key applications with low risk of harm to patients&#x2019; health can be prioritized, such as patient registration codes [<xref ref-type="bibr" rid="ref85">85</xref>], screening [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref86">86</xref>], and extraction of key information from medical records [<xref ref-type="bibr" rid="ref87">87</xref>]. Through a &#x201C;human-on-the-loop&#x201D; human-machine collaboration model, reinforcement learning techniques are introduced to optimize prompt strategies and model decisions, enhance model transparency and clinician engagement, and strengthen human oversight.</p></sec><sec id="s4-4"><title>Limitations of This Systematic Review</title><p>This review includes studies published up to January 1, 2025. Due to the rapid development of LLMs and fast publication cycles, some recent findings may have been missed. To address this, we expedited manuscript preparation and included several additional studies from the past 7 months (from January to July 2025) in the discussion. To ensure the comprehensiveness and relevance of this review, we included all studies that provided complete data and full-text availability. However, some of the included conference papers and preprints may not have undergone peer review, potentially affecting the reliability of the findings. Nonetheless, our quality assessment indicated that their risk of bias did not differ significantly from that of peer-reviewed journal articles. Although 6 databases were searched, relevant studies outside these sources may have been overlooked. We also limited inclusion to English-language articles, which may affect generalizability, although only 2 non-English articles were excluded. Meanwhile, research conducted across different countries may be affected by population diversity and bias in training datasets. Unlike traditional reviews of clinical interventions, this study applied different quality assessment methods tailored to various application scenarios. Some criteria relied on subjective judgment, and the complexity of the process may have introduced bias. To minimize this, 2 researchers (SC and ZL) assessed studies independently, discrepancies were resolved with a third reviewer, and final decisions were validated by 2 experts (LG and KH).</p></sec><sec id="s4-5"><title>Conclusions</title><p>In summary, this systematic review offers an overview of the applications and research involving LLMs in LC, accompanied by a quality assessment. LLMs can assist physicians in interpreting test reports, delivering diagnostic and treatment recommendations, and supporting education, research, and public outreach efforts. The development of multimodal models, data quality, privacy-preserving mechanisms, and advanced LLM architectures is key to integrating these technologies into the full-cycle management of LC care. Within an ethical framework and under appropriate human oversight, future efforts should focus on validating LLM applications in real-world clinical settings and the inclusion of underrepresented populations to ensure population diversity, ultimately promoting their development toward greater specialization, accuracy, and patient-centeredness.</p></sec></sec></body><back><ack><p>This work was supported by the Beijing University of Chinese Medicine East Hospital and Beijing Municipal Science &#x0026; Technology Commission. This research was funded by National Key R&#x0026;D Program of China (2024YFC3505400), The Science and Technology Plan Project of Beijing (grant Z221100003522029 and grant Z241100007724010), Education Science Research Project, National High Level Chinese Medicine Hospital Clinical Research Funding (DFRCZY-2024GJRC009 and DFRCZY-2024GJRC017).</p></ack><notes><sec><title>Data Availability</title><p>The data that support the findings of this study are available from the corresponding author upon reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>KH and LG conceived the study and contributed equally. RZ and SC collected the data and wrote the manuscript. RZ, SC, and ZL extracted information and conducted quality assessment. TG and YS added references and enriched the discussion section. DL and WZ polished the English content of the manuscript. RZ, SC, LG, and KH revised and reviewed the manuscript.</p><p>Gao Lei and Hu Kaiwen are co-corresponding authors and contributed equally to this work.</p><p>Ruikang Zhong and Siyi Chen contributed equally to this work.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations:</title><def-list><def-item><term id="abb1">CT</term><def><p>computed tomography</p></def></def-item><def-item><term id="abb2">GI</term><def><p>gastrointestinal</p></def></def-item><def-item><term id="abb3">HIPAA </term><def><p>Health Insurance Portability and Accountability Act</p></def></def-item><def-item><term id="abb4">LC</term><def><p>lung cancer</p></def></def-item><def-item><term id="abb5">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb6">NSCLC</term><def><p>non-small cell carcinoma</p></def></def-item><def-item><term id="abb7">OS</term><def><p>overall survival</p></def></def-item><def-item><term id="abb8">PRISMA</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p></def></def-item><def-item><term id="abb9">PROBAST</term><def><p>Prediction model Risk Of Bias Assessment Tool</p></def></def-item><def-item><term id="abb10">PROSPERO</term><def><p>Prospective Register of Systematic Reviews</p></def></def-item><def-item><term id="abb11">QUADAS-2</term><def><p>Quality Assessment of Diagnostic Accuracy Studies-2</p></def></def-item><def-item><term id="abb12">RADS</term><def><p>Reporting and Data System</p></def></def-item><def-item><term id="abb13">RAG</term><def><p>retrieval-augmented generation</p></def></def-item><def-item><term id="abb14">REK</term><def><p>reliable external knowledge</p></def></def-item><def-item><term id="abb15">ROBINS-I</term><def><p>Risk Of Bias In Non-randomized Studies - of Interventions</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Siegel</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Kratzer</surname><given-names>TB</given-names> </name><name name-style="western"><surname>Giaquinto</surname><given-names>AN</given-names> </name><name name-style="western"><surname>Sung</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jemal</surname><given-names>A</given-names> </name></person-group><article-title>Cancer statistics, 2025</article-title><source>CA Cancer J Clin</source><year>2025</year><volume>75</volume><issue>1</issue><fpage>10</fpage><lpage>45</lpage><pub-id pub-id-type="doi">10.3322/caac.21871</pub-id><pub-id pub-id-type="medline">39817679</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bray</surname><given-names>F</given-names> </name><name name-style="western"><surname>Laversanne</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sung</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Global cancer statistics 2022: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title><source>CA Cancer J Clin</source><year>2024</year><volume>74</volume><issue>3</issue><fpage>229</fpage><lpage>263</lpage><pub-id pub-id-type="doi">10.3322/caac.21834</pub-id><pub-id pub-id-type="medline">38572751</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thiruvengadam</surname><given-names>R</given-names> </name><name name-style="western"><surname>Singh</surname><given-names>CD</given-names> </name><name name-style="western"><surname>Kondapavuluri</surname><given-names>BK</given-names> </name><name name-style="western"><surname>Gurusamy</surname><given-names>S</given-names> </name><name name-style="western"><surname>Venkidasamy</surname><given-names>B</given-names> </name><name name-style="western"><surname>Thiruvengadam</surname><given-names>M</given-names> </name></person-group><article-title>Biomarkers in lung cancer treatment</article-title><source>Clin Chim Acta</source><year>2025</year><month>05</month><day>15</day><volume>572</volume><fpage>120267</fpage><pub-id pub-id-type="doi">10.1016/j.cca.2025.120267</pub-id><pub-id pub-id-type="medline">40154724</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Peeters</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lau</surname><given-names>K</given-names> </name><name name-style="western"><surname>Stefanidis</surname><given-names>K</given-names> </name><etal/></person-group><article-title>New diagnostic and nonsurgical local treatment modalities for early stage lung cancer</article-title><source>Lung Cancer (Auckl)</source><year>2024</year><month>10</month><volume>196</volume><fpage>107952</fpage><pub-id pub-id-type="doi">10.1016/j.lungcan.2024.107952</pub-id><pub-id pub-id-type="medline">39236577</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>The National Lung Screening Trial Research Team</collab><name name-style="western"><surname>Adams</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Aberle</surname><given-names>DR</given-names> </name></person-group><article-title>Reduced lung-cancer mortality with low-dose computed tomographic screening</article-title><source>N Engl J Med</source><year>2011</year><month>08</month><day>4</day><volume>365</volume><issue>5</issue><fpage>395</fpage><lpage>409</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1102873</pub-id><pub-id pub-id-type="medline">31995683</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jonas</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Reuland</surname><given-names>DS</given-names> </name><name name-style="western"><surname>Reddy</surname><given-names>SM</given-names> </name><etal/></person-group><article-title>Screening for lung cancer with low-dose computed tomography: updated evidence report and systematic review for the US preventive services task force</article-title><source>JAMA</source><year>2021</year><month>03</month><day>9</day><volume>325</volume><issue>10</issue><fpage>971</fpage><lpage>987</lpage><pub-id pub-id-type="doi">10.1001/jama.2021.0377</pub-id><pub-id pub-id-type="medline">33687468</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>MK</given-names> </name></person-group><article-title>Effectiveness of nursing interventions based on lung cancer trajectory: a systematic review and meta-analysis</article-title><source>Int Nurs Rev</source><year>2025</year><month>09</month><volume>72</volume><issue>3</issue><fpage>e13074</fpage><pub-id pub-id-type="doi">10.1111/inr.13074</pub-id><pub-id pub-id-type="medline">39604008</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xiang</surname><given-names>R</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Q</given-names> </name></person-group><article-title>Development status and thinking of the &#x201C;integrated diagnosis and treatment, full-course management&#x201D; model of lung cancer- based on the experience of the lung cancer MDT team of Sichuan Cancer Hospital</article-title><source>Zhongguo Fei Ai Za Zhi</source><year>2020</year><month>04</month><day>20</day><volume>23</volume><issue>4</issue><fpage>211</fpage><lpage>215</lpage><pub-id pub-id-type="doi">10.3779/j.issn.1009-3419.2020.101.12</pub-id><pub-id pub-id-type="medline">32316710</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lucas</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Upperman</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Robinson</surname><given-names>JR</given-names> </name></person-group><article-title>A systematic review of large language models and their implications in medical education</article-title><source>Med Educ</source><year>2024</year><month>11</month><volume>58</volume><issue>11</issue><fpage>1276</fpage><lpage>1285</lpage><pub-id pub-id-type="doi">10.1111/medu.15402</pub-id><pub-id pub-id-type="medline">38639098</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>W</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>K</given-names> </name><etal/></person-group><article-title>A survey of large language models</article-title><source>arXiv</source><comment>Preprint posted online on  Mar 31, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2303.18223</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Turner</surname><given-names>JH</given-names> </name></person-group><article-title>Triangle of trust in cancer care? The physician, the patient, and artificial intelligence chatbot</article-title><source>Cancer Biother Radiopharm</source><year>2023</year><month>11</month><volume>38</volume><issue>9</issue><fpage>581</fpage><lpage>584</lpage><pub-id pub-id-type="doi">10.1089/cbr.2023.0112</pub-id><pub-id pub-id-type="medline">37707991</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zack</surname><given-names>T</given-names> </name><name name-style="western"><surname>Lehman</surname><given-names>E</given-names> </name><name name-style="western"><surname>Suzgun</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Assessing the potential of GPT-4 to perpetuate racial and gender biases in health care: a model evaluation study</article-title><source>Lancet Digit Health</source><year>2024</year><month>01</month><volume>6</volume><issue>1</issue><fpage>e12</fpage><lpage>e22</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(23)00225-X</pub-id><pub-id pub-id-type="medline">38123252</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Athaluri</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Manthena</surname><given-names>SV</given-names> </name><name name-style="western"><surname>Kesapragada</surname><given-names>V</given-names> </name><name name-style="western"><surname>Yarlagadda</surname><given-names>V</given-names> </name><name name-style="western"><surname>Dave</surname><given-names>T</given-names> </name><name name-style="western"><surname>Duddumpudi</surname><given-names>RTS</given-names> </name></person-group><article-title>Exploring the boundaries of reality: investigating the phenomenon of artificial intelligence hallucination in scientific writing through ChatGPT references</article-title><source>Cureus</source><year>2023</year><month>04</month><volume>15</volume><issue>4</issue><fpage>e37432</fpage><pub-id pub-id-type="doi">10.7759/cureus.37432</pub-id><pub-id pub-id-type="medline">37182055</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garg</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>S</given-names> </name><name name-style="western"><surname>Vats</surname><given-names>S</given-names> </name><name name-style="western"><surname>Handa</surname><given-names>P</given-names> </name><name name-style="western"><surname>Goel</surname><given-names>N</given-names> </name></person-group><article-title>Prospect of large language models and natural language processing for lung cancer diagnosis: a systematic review</article-title><source>Expert Systems</source><year>2024</year><month>11</month><access-date>2025-09-17</access-date><volume>41</volume><issue>11</issue><fpage>e13697</fpage><comment><ext-link ext-link-type="uri" xlink:href="https://onlinelibrary.wiley.com/toc/14680394/41/11">https://onlinelibrary.wiley.com/toc/14680394/41/11</ext-link></comment><pub-id pub-id-type="doi">10.1111/exsy.13697</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Page</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>McKenzie</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Bossuyt</surname><given-names>PM</given-names> </name><etal/></person-group><article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title><source>BMJ</source><year>2021</year><month>03</month><day>29</day><volume>372</volume><fpage>n71</fpage><pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id><pub-id pub-id-type="medline">33782057</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Omar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Levkovich</surname><given-names>I</given-names> </name></person-group><article-title>Exploring the efficacy and potential of large language models for depression: a systematic review</article-title><source>J Affect Disord</source><year>2025</year><month>02</month><day>15</day><volume>371</volume><fpage>234</fpage><lpage>244</lpage><pub-id pub-id-type="doi">10.1016/j.jad.2024.11.052</pub-id><pub-id pub-id-type="medline">39581383</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Whiting</surname><given-names>PF</given-names> </name><name name-style="western"><surname>Rutjes</surname><given-names>AWS</given-names> </name><name name-style="western"><surname>Westwood</surname><given-names>ME</given-names> </name><etal/></person-group><article-title>QUADAS-2: a revised tool for the quality assessment of diagnostic accuracy studies</article-title><source>Ann Intern Med</source><year>2011</year><month>10</month><day>18</day><volume>155</volume><issue>8</issue><fpage>529</fpage><lpage>536</lpage><pub-id pub-id-type="doi">10.7326/0003-4819-155-8-201110180-00009</pub-id><pub-id pub-id-type="medline">22007046</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><name name-style="western"><surname>Wolff</surname><given-names>RF</given-names> </name><name name-style="western"><surname>Riley</surname><given-names>RD</given-names> </name><etal/></person-group><article-title>PROBAST: a tool to assess risk of bias and applicability of prediction model studies: explanation and elaboration</article-title><source>Ann Intern Med</source><year>2019</year><month>01</month><day>1</day><volume>170</volume><issue>1</issue><fpage>W1</fpage><lpage>W33</lpage><pub-id pub-id-type="doi">10.7326/M18-1377</pub-id><pub-id pub-id-type="medline">30596876</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sterne</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Hern&#x00E1;n</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Reeves</surname><given-names>BC</given-names> </name><etal/></person-group><article-title>ROBINS-I: a tool for assessing risk of bias in non-randomised studies of interventions</article-title><source>BMJ</source><year>2016</year><month>10</month><day>12</day><volume>355</volume><fpage>i4919</fpage><pub-id pub-id-type="doi">10.1136/bmj.i4919</pub-id><pub-id pub-id-type="medline">27733354</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bhattarai</surname><given-names>K</given-names> </name><name name-style="western"><surname>Oh</surname><given-names>IY</given-names> </name><name name-style="western"><surname>Sierra</surname><given-names>JM</given-names> </name><etal/></person-group><article-title>Leveraging GPT-4 for identifying cancer phenotypes in electronic health records: a performance comparison between GPT-4, GPT-3.5-turbo, Flan-T5, Llama-3-8B, and spaCy&#x2019;s rule-based and machine learning-based methods</article-title><source>JAMIA Open</source><year>2024</year><month>10</month><volume>7</volume><issue>3</issue><fpage>ooae060</fpage><pub-id pub-id-type="doi">10.1093/jamiaopen/ooae060</pub-id><pub-id pub-id-type="medline">38962662</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fink</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Bischoff</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fink</surname><given-names>CA</given-names> </name><etal/></person-group><article-title>Potential of ChatGPT and GPT-4 for data mining of free-text CT reports on lung cancer</article-title><source>Radiology</source><year>2023</year><month>09</month><volume>308</volume><issue>3</issue><fpage>e231362</fpage><pub-id pub-id-type="doi">10.1148/radiol.231362</pub-id><pub-id pub-id-type="medline">37724963</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Lu</surname><given-names>XD</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>N</given-names> </name></person-group><article-title>Zero-shot information extraction from radiological reports using ChatGPT</article-title><source>Int J Med Inform</source><year>2024</year><month>03</month><volume>183</volume><fpage>105321</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105321</pub-id><pub-id pub-id-type="medline">38157785</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Naik</surname><given-names>N</given-names> </name><name name-style="western"><surname>Khandelwal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Joshi</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Applying large language models for causal structure learning in non small cell lung cancer</article-title><conf-name>2024 IEEE 12th International Conference on Healthcare Informatics (ICHI)</conf-name><conf-date>Jun 3, 2024</conf-date><conf-loc>Orlando, FL, USA</conf-loc><pub-id pub-id-type="doi">10.1109/ICHI61247.2024.00110</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Niu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kaviani</surname><given-names>P</given-names> </name><name name-style="western"><surname>Lyu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Kalra</surname><given-names>MK</given-names> </name><name name-style="western"><surname>Whitlow</surname><given-names>CT</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>G</given-names> </name></person-group><article-title>Cross-institutional structured radiology reporting for lung cancer screening using a dynamic template-constrained large language model</article-title><source>arXiv</source><comment>Preprint posted online on  Sep 26, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2409.18319</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>K</given-names> </name><name name-style="western"><surname>Paek</surname><given-names>H</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>LC</given-names> </name><etal/></person-group><article-title>SEETrials: leveraging large language models for safety and efficacy extraction in oncology clinical trials</article-title><source>Inform Med Unlocked</source><year>2024</year><volume>50</volume><fpage>101589</fpage><pub-id pub-id-type="doi">10.1016/j.imu.2024.101589</pub-id><pub-id pub-id-type="medline">39493413</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lyu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zapadka</surname><given-names>ME</given-names> </name><etal/></person-group><article-title>Translating radiology reports into plain language using ChatGPT and GPT-4 with prompt learning: results, limitations, and potential</article-title><source>Vis Comput Ind Biomed Art</source><year>2023</year><month>05</month><day>18</day><volume>6</volume><issue>1</issue><fpage>9</fpage><pub-id pub-id-type="doi">10.1186/s42492-023-00136-5</pub-id><pub-id pub-id-type="medline">37198498</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferrari-Light</surname><given-names>D</given-names> </name><name name-style="western"><surname>Merritt</surname><given-names>RE</given-names> </name><name name-style="western"><surname>D&#x2019;Souza</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Evaluating ChatGPT as a patient resource for frequently asked questions about lung cancer surgery-a pilot study</article-title><source>J Thorac Cardiovasc Surg</source><year>2025</year><month>04</month><volume>169</volume><issue>4</issue><fpage>1174</fpage><lpage>1180</lpage><pub-id pub-id-type="doi">10.1016/j.jtcvs.2024.09.030</pub-id><pub-id pub-id-type="medline">39326732</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gencer</surname><given-names>A</given-names> </name></person-group><article-title>Readability analysis of ChatGPT&#x2019;s responses on lung cancer</article-title><source>Sci Rep</source><year>2024</year><month>07</month><day>26</day><volume>14</volume><issue>1</issue><fpage>17234</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-67293-2</pub-id><pub-id pub-id-type="medline">39060365</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haver</surname><given-names>HL</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>CT</given-names> </name><name name-style="western"><surname>Sirajuddin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yi</surname><given-names>PH</given-names> </name><name name-style="western"><surname>Jeudy</surname><given-names>J</given-names> </name></person-group><article-title>Use of ChatGPT, GPT-4, and Bard to improve readability of ChatGPT&#x2019;s answers to common questions about lung cancer and lung cancer screening</article-title><source>AJR Am J Roentgenol</source><year>2023</year><month>11</month><volume>221</volume><issue>5</issue><fpage>701</fpage><lpage>704</lpage><pub-id pub-id-type="doi">10.2214/AJR.23.29622</pub-id><pub-id pub-id-type="medline">37341179</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Janopaul-Naylor</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Koo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Qian</surname><given-names>DC</given-names> </name><name name-style="western"><surname>McCall</surname><given-names>NS</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>SA</given-names> </name></person-group><article-title>Physician assessment of ChatGPT and Bing answers to American Cancer Society&#x2019;s questions to ask about your cancer</article-title><source>Am J Clin Oncol</source><year>2024</year><month>01</month><day>1</day><volume>47</volume><issue>1</issue><fpage>17</fpage><lpage>21</lpage><pub-id pub-id-type="doi">10.1097/COC.0000000000001050</pub-id><pub-id pub-id-type="medline">37823708</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rogasch</surname><given-names>JMM</given-names> </name><name name-style="western"><surname>Metzger</surname><given-names>G</given-names> </name><name name-style="western"><surname>Preisler</surname><given-names>M</given-names> </name><etal/></person-group><article-title>ChatGPT: can you prepare my patients for [<sup>18</sup>F]FDG PET/CT and explain my reports?</article-title><source>J Nucl Med</source><year>2023</year><month>12</month><day>1</day><volume>64</volume><issue>12</issue><fpage>1876</fpage><lpage>1879</lpage><pub-id pub-id-type="doi">10.2967/jnumed.123.266114</pub-id><pub-id pub-id-type="medline">37709536</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rahsepar</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Tavakoli</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>GHJ</given-names> </name><name name-style="western"><surname>Hassani</surname><given-names>C</given-names> </name><name name-style="western"><surname>Abtin</surname><given-names>F</given-names> </name><name name-style="western"><surname>Bedayat</surname><given-names>A</given-names> </name></person-group><article-title>How AI responds to common lung cancer questions: ChatGPT vs Google Bard</article-title><source>Radiology</source><year>2023</year><month>06</month><volume>307</volume><issue>5</issue><fpage>e230922</fpage><pub-id pub-id-type="doi">10.1148/radiol.230922</pub-id><pub-id pub-id-type="medline">37310252</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cho</surname><given-names>H</given-names> </name><name name-style="western"><surname>Yoo</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Extracting lung cancer staging descriptors from pathology reports: a generative language model approach</article-title><source>J Biomed Inform</source><year>2024</year><month>09</month><volume>157</volume><fpage>104720</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2024.104720</pub-id><pub-id pub-id-type="medline">39233209</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dehdab</surname><given-names>R</given-names> </name><name name-style="western"><surname>Brendlin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Werner</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Evaluating ChatGPT-4V in chest CT diagnostics: a critical image interpretation assessment</article-title><source>Jpn J Radiol</source><year>2024</year><month>10</month><volume>42</volume><issue>10</issue><fpage>1168</fpage><lpage>1177</lpage><pub-id pub-id-type="doi">10.1007/s11604-024-01606-3</pub-id><pub-id pub-id-type="medline">38867035</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>N</given-names> </name></person-group><article-title>The power of combining data and knowledge: GPT-4o is an effective interpreter of machine learning models in predicting lymph node metastasis of lung cancer</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 25, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2407.17900</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Rong</surname><given-names>R</given-names> </name><etal/></person-group><article-title>A critical assessment of using ChatGPT for extracting structured data from clinical notes</article-title><source>NPJ Digit Med</source><year>2024</year><month>05</month><day>1</day><volume>7</volume><issue>1</issue><fpage>106</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01079-8</pub-id><pub-id pub-id-type="medline">38693429</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yasaka</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kanzawa</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kanemaru</surname><given-names>N</given-names> </name><name name-style="western"><surname>Koshino</surname><given-names>S</given-names> </name><name name-style="western"><surname>Abe</surname><given-names>O</given-names> </name></person-group><article-title>Fine-tuned large language model for extracting patients on pretreatment for lung cancer from a picture archiving and communication system based on radiological reports</article-title><source>J Imaging Inform Med</source><year>2025</year><month>02</month><volume>38</volume><issue>1</issue><fpage>327</fpage><lpage>334</lpage><pub-id pub-id-type="doi">10.1007/s10278-024-01186-8</pub-id><pub-id pub-id-type="medline">38955964</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Vallabhaneni</surname><given-names>GV</given-names> </name><name name-style="western"><surname>Rahul</surname><given-names>YS</given-names> </name><name name-style="western"><surname>Kumari</surname><given-names>KS</given-names> </name></person-group><article-title>Improved lung cancer detection through use of large language systems with graphical attributes</article-title><year>2024</year><month>05</month><conf-name>2024 IEEE International Conference on Computing, Power and Communication Technologies (IC2PCT)</conf-name><conf-date>Feb 9-10, 2024</conf-date><conf-loc>Greater Noida, India</conf-loc><pub-id pub-id-type="doi">10.1109/IC2PCT60090.2024.10486290</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Qu</surname><given-names>LH</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>XY</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>KX</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>MN</given-names> </name><name name-style="western"><surname>Song</surname><given-names>ZJ</given-names> </name></person-group><article-title>The rise of AI language pathologists: exploring two-level prompt learning for few-shot weakly-supervised whole slide image classification</article-title><source>arXiv</source><comment>Preprint posted online on  May 29, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2305.17891</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Panagoulias</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Palamidas</surname><given-names>FA</given-names> </name><name name-style="western"><surname>Virvou</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tsihrintzis</surname><given-names>GA</given-names> </name></person-group><article-title>Evaluation of chatgpt-supported diagnosis, staging and treatment planning for the case of lung cancer</article-title><year>2024</year><month>11</month><conf-name>2023 20th ACS/IEEE International Conference on Computer Systems and Applications (AICCSA)</conf-name><conf-date>Dec 4-7, 2023</conf-date><conf-loc>Giza, Egypt</conf-loc><pub-id pub-id-type="doi">10.1109/AICCSA59173.2023.10479348</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Mithun</surname><given-names>S</given-names> </name><name name-style="western"><surname>Sherkhane</surname><given-names>UB</given-names> </name><name name-style="western"><surname>Jha</surname><given-names>AK</given-names> </name><etal/></person-group><article-title>Transfer learning with BERT and ClinicalBERT models for multiclass classification of radiology imaging reports</article-title><comment>Preprint posted online on  Jul 22, 2024</comment><pub-id pub-id-type="doi">10.21203/rs.3.rs-4443132/v1</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Park</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Song</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Park</surname><given-names>B</given-names> </name><name name-style="western"><surname>Jeong</surname><given-names>YJ</given-names> </name></person-group><article-title>Lung cancer staging using chest CT and FDG PET/CT free-text reports: comparison among three ChatGPT large language models and six human readers of varying experience</article-title><source>AJR Am J Roentgenol</source><year>2024</year><month>12</month><volume>223</volume><issue>6</issue><fpage>e2431696</fpage><pub-id pub-id-type="doi">10.2214/AJR.24.31696</pub-id><pub-id pub-id-type="medline">39230409</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dong</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Gay</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Large-language-model empowered 3D dose prediction for intensity-modulated radiotherapy</article-title><source>Med Phys</source><year>2025</year><month>01</month><volume>52</volume><issue>1</issue><fpage>619</fpage><lpage>632</lpage><pub-id pub-id-type="doi">10.1002/mp.17416</pub-id><pub-id pub-id-type="medline">39316523</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jeong</surname><given-names>S</given-names> </name><name name-style="western"><surname>Pyo</surname><given-names>H</given-names> </name><name name-style="western"><surname>Park</surname><given-names>W</given-names> </name><name name-style="western"><surname>Han</surname><given-names>Y</given-names> </name></person-group><article-title>The prediction of stress in radiation therapy: integrating artificial intelligence with biological signals</article-title><source>Cancers (Basel)</source><year>2024</year><month>05</month><day>22</day><volume>16</volume><issue>11</issue><fpage>1964</fpage><pub-id pub-id-type="doi">10.3390/cancers16111964</pub-id><pub-id pub-id-type="medline">38893087</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dos Santos</surname><given-names>FC</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>LG</given-names> </name><name name-style="western"><surname>Madandola</surname><given-names>OO</given-names> </name><etal/></person-group><article-title>An example of leveraging AI for documentation: ChatGPT-generated nursing care plan for an older adult with lung cancer</article-title><source>J Am Med Inform Assoc</source><year>2024</year><month>09</month><day>1</day><volume>31</volume><issue>9</issue><fpage>2089</fpage><lpage>2096</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocae116</pub-id><pub-id pub-id-type="medline">38758655</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ye</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>NL</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>GQ</given-names> </name></person-group><article-title>Scientific figures interpreted by ChatGPT: strengths in plot recognition and limits in color perception</article-title><source>NPJ Precis Oncol</source><year>2024</year><month>04</month><day>5</day><volume>8</volume><issue>1</issue><fpage>84</fpage><pub-id pub-id-type="doi">10.1038/s41698-024-00576-z</pub-id><pub-id pub-id-type="medline">38580746</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Devi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Uttrani</surname><given-names>S</given-names> </name><name name-style="western"><surname>Singla</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Automating clinical trial eligibility screening: quantitative analysis of GPT models versus human expertise</article-title><conf-name>17th International Conference on PErvasive Technologies Related to Assistive Environments</conf-name><conf-date>Jun 26, 2024</conf-date><conf-loc>Crete Greece</conf-loc><pub-id pub-id-type="doi">10.1145/3652037.3663922</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ashofteh Barabadi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>WY</given-names> </name><name name-style="western"><surname>Simpson</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Do</surname><given-names>RKG</given-names> </name></person-group><article-title>Targeted generative data augmentation for automatic metastases detection from free-text radiology reports</article-title><source>Front Artif Intell</source><year>2025</year><volume>8</volume><fpage>1513674</fpage><pub-id pub-id-type="doi">10.3389/frai.2025.1513674</pub-id><pub-id pub-id-type="medline">39981192</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>N</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Assessments of lung nodules by an artificial intelligence chatbot using longitudinal CT images</article-title><source>Cell Rep Med</source><year>2025</year><month>03</month><day>18</day><volume>6</volume><issue>3</issue><fpage>101988</fpage><pub-id pub-id-type="doi">10.1016/j.xcrm.2025.101988</pub-id><pub-id pub-id-type="medline">40043704</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chansky</surname><given-names>K</given-names> </name><name name-style="western"><surname>Detterbeck</surname><given-names>FC</given-names> </name><name name-style="western"><surname>Nicholson</surname><given-names>AG</given-names> </name><etal/></person-group><article-title>The IASLC Lung Cancer Staging Project: external validation of the revision of the TNM stage groupings in the eighth edition of the TNM classification of lung cancer</article-title><source>J Thorac Oncol</source><year>2017</year><month>07</month><volume>12</volume><issue>7</issue><fpage>1109</fpage><lpage>1121</lpage><pub-id pub-id-type="doi">10.1016/j.jtho.2017.04.011</pub-id><pub-id pub-id-type="medline">28461257</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bhamani</surname><given-names>A</given-names> </name><name name-style="western"><surname>Creamer</surname><given-names>A</given-names> </name><name name-style="western"><surname>Verghese</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Low-dose CT for lung cancer screening in a high-risk population (SUMMIT): a prospective, longitudinal cohort study</article-title><source>Lancet Oncol</source><year>2025</year><month>05</month><volume>26</volume><issue>5</issue><fpage>609</fpage><lpage>619</lpage><pub-id pub-id-type="doi">10.1016/S1470-2045(25)00082-8</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ding</surname><given-names>H</given-names> </name><name name-style="western"><surname>Xia</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Evaluation and practical application of prompt-driven ChatGPTs for EMR generation</article-title><source>NPJ Digit Med</source><year>2025</year><month>02</month><day>2</day><volume>8</volume><issue>1</issue><fpage>77</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01472-x</pub-id><pub-id pub-id-type="medline">39894840</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Singh</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hamouda</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chamberlin</surname><given-names>JH</given-names> </name><etal/></person-group><article-title>ChatGPT vs. Gemini: comparative accuracy and efficiency in Lung-RADS score assignment from radiology reports</article-title><source>Clin Imaging</source><year>2025</year><month>05</month><volume>121</volume><fpage>110455</fpage><pub-id pub-id-type="doi">10.1016/j.clinimag.2025.110455</pub-id><pub-id pub-id-type="medline">40090067</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gong</surname><given-names>EJ</given-names> </name><name name-style="western"><surname>Bang</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>JJ</given-names> </name><etal/></person-group><article-title>Large language models in gastroenterology: systematic review</article-title><source>J Med Internet Res</source><year>2024</year><month>12</month><day>20</day><volume>26</volume><fpage>e66648</fpage><pub-id pub-id-type="doi">10.2196/66648</pub-id><pub-id pub-id-type="medline">39705703</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>WT</given-names> </name><etal/></person-group><article-title>A survey on hallucination in large language models: principles, taxonomy, challenges, and open questions</article-title><source>arXiv</source><comment>Preprint posted online on  Nov 19, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2311.05232</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schulze Buschoff</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Akata</surname><given-names>E</given-names> </name><name name-style="western"><surname>Bethge</surname><given-names>M</given-names> </name><name name-style="western"><surname>Schulz</surname><given-names>E</given-names> </name></person-group><article-title>Visual cognition in multimodal large language models</article-title><source>Nat Mach Intell</source><year>2025</year><volume>7</volume><issue>1</issue><fpage>96</fpage><lpage>106</lpage><pub-id pub-id-type="doi">10.1038/s42256-024-00963-y</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zabaleta</surname><given-names>J</given-names> </name><name name-style="western"><surname>Aguinagalde</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lopez</surname><given-names>I</given-names> </name><etal/></person-group><article-title>Utility of artificial intelligence for decision making in thoracic multidisciplinary tumor boards</article-title><source>J Clin Med</source><year>2025</year><month>01</month><day>10</day><volume>14</volume><issue>2</issue><fpage>399</fpage><pub-id pub-id-type="doi">10.3390/jcm14020399</pub-id><pub-id pub-id-type="medline">39860405</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brown</surname><given-names>EDL</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Donnelly</surname><given-names>BM</given-names> </name><name name-style="western"><surname>Ward</surname><given-names>M</given-names> </name><name name-style="western"><surname>Vojnic</surname><given-names>M</given-names> </name><name name-style="western"><surname>D&#x2019;Amico</surname><given-names>RS</given-names> </name></person-group><article-title>Precision oncology in non-small cell lung cancer: a comparative study of contextualized ChatGPT models</article-title><source>Cureus</source><year>2025</year><month>03</month><volume>17</volume><issue>3</issue><fpage>e81097</fpage><pub-id pub-id-type="doi">10.7759/cureus.81097</pub-id><pub-id pub-id-type="medline">40271313</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Li</surname><given-names>M</given-names> </name><etal/></person-group><article-title>A feasibility study of automating radiotherapy planning with large language model agents</article-title><source>Phys Med Biol</source><year>2025</year><month>03</month><day>21</day><volume>70</volume><issue>7</issue><pub-id pub-id-type="doi">10.1088/1361-6560/adbff1</pub-id><pub-id pub-id-type="medline">40073507</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paolo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Greco</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cortellini</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Hierarchical embedding attention for overall survival prediction in lung cancer from unstructured EHRs</article-title><source>BMC Med Inform Decis Mak</source><year>2025</year><month>04</month><day>18</day><volume>25</volume><issue>1</issue><fpage>169</fpage><pub-id pub-id-type="doi">10.1186/s12911-025-02998-6</pub-id><pub-id pub-id-type="medline">40251623</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yamagishi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Nakamura</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Hanaoka</surname><given-names>S</given-names> </name><name name-style="western"><surname>Abe</surname><given-names>O</given-names> </name></person-group><article-title>Large language model approach for zero-shot information extraction and clustering of Japanese radiology reports: algorithm development and validation</article-title><source>JMIR Cancer</source><year>2025</year><month>01</month><day>23</day><volume>11</volume><fpage>e57275</fpage><pub-id pub-id-type="doi">10.2196/57275</pub-id><pub-id pub-id-type="medline">39864093</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Xiao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Cross language transformation of free text into structured lobectomy surgical records from a multi center study</article-title><source>Sci Rep</source><year>2025</year><month>05</month><day>2</day><volume>15</volume><issue>1</issue><fpage>15417</fpage><pub-id pub-id-type="doi">10.1038/s41598-025-97500-7</pub-id><pub-id pub-id-type="medline">40316625</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Forsythe</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rege</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Kaufman</surname><given-names>P</given-names> </name></person-group><article-title>BIO25-024: real-time clinical trial data library in non-small cell lung (NSCLC), prostate (PC), and breast cancer (BC) to support informed treatment decisions: now a reality with a fine-tuned large language model (LLM)</article-title><source>J Natl Compr Canc Netw</source><year>2025</year><month>03</month><day>28</day><volume>23</volume><issue>3.5</issue><fpage>BIO25-024</fpage><pub-id pub-id-type="doi">10.6004/jnccn.2024.7156</pub-id><pub-id pub-id-type="medline">40157350</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yuan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Gu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Artificial intelligence-assisted machine learning models for predicting lung cancer survival</article-title><source>Asia Pac J Oncol Nurs</source><year>2025</year><month>12</month><volume>12</volume><fpage>100680</fpage><pub-id pub-id-type="doi">10.1016/j.apjon.2025.100680</pub-id><pub-id pub-id-type="medline">40201531</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xiang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>A vision&#x2013;language foundation model for precision oncology</article-title><source>Nature New Biol</source><year>2025</year><month>02</month><day>20</day><volume>638</volume><issue>8051</issue><fpage>769</fpage><lpage>778</lpage><pub-id pub-id-type="doi">10.1038/s41586-024-08378-w</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Teramoto</surname><given-names>A</given-names> </name><name name-style="western"><surname>Michiba</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kiriyama</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tsukamoto</surname><given-names>T</given-names> </name><name name-style="western"><surname>Imaizumi</surname><given-names>K</given-names> </name><name name-style="western"><surname>Fujita</surname><given-names>H</given-names> </name></person-group><article-title>Automated description generation of cytologic findings for lung cytological images using a pretrained vision model and dual text decoders: preliminary study</article-title><source>Cytopathology</source><year>2025</year><month>05</month><volume>36</volume><issue>3</issue><fpage>240</fpage><lpage>249</lpage><pub-id pub-id-type="doi">10.1111/cyt.13474</pub-id><pub-id pub-id-type="medline">39918342</pub-id></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lehr</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Caliskan</surname><given-names>A</given-names> </name><name name-style="western"><surname>Liyanage</surname><given-names>S</given-names> </name><name name-style="western"><surname>Banaji</surname><given-names>MR</given-names> </name></person-group><article-title>ChatGPT as research scientist: probing GPT&#x2019;s capabilities as a research librarian, research ethicist, data generator, and data predictor</article-title><source>Proc Natl Acad Sci U S A</source><year>2024</year><month>08</month><day>27</day><volume>121</volume><issue>35</issue><fpage>e2404328121</fpage><pub-id pub-id-type="doi">10.1073/pnas.2404328121</pub-id><pub-id pub-id-type="medline">39163339</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Singhal</surname><given-names>K</given-names> </name><name name-style="western"><surname>Tu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Gottweis</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Toward expert-level medical question answering with large language models</article-title><source>Nat Med</source><year>2025</year><month>03</month><volume>31</volume><issue>3</issue><fpage>943</fpage><lpage>950</lpage><pub-id pub-id-type="doi">10.1038/s41591-024-03423-7</pub-id><pub-id pub-id-type="medline">39779926</pub-id></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yoon</surname><given-names>W</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name><etal/></person-group><article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title><source>Bioinformatics</source><year>2020</year><month>02</month><day>15</day><volume>36</volume><issue>4</issue><fpage>1234</fpage><lpage>1240</lpage><pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id><pub-id pub-id-type="medline">31501885</pub-id></nlm-citation></ref><ref id="ref70"><label>70</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Altosaar</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ranganath</surname><given-names>R</given-names> </name></person-group><article-title>ClinicalBERT: modeling clinical notes and predicting hospital readmission</article-title><source>arXiv</source><comment>Preprint posted online on  Nov 29, 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.1904.05342</pub-id></nlm-citation></ref><ref id="ref71"><label>71</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khalpey</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Kumar</surname><given-names>U</given-names> </name><name name-style="western"><surname>King</surname><given-names>N</given-names> </name><name name-style="western"><surname>Abraham</surname><given-names>A</given-names> </name><name name-style="western"><surname>Khalpey</surname><given-names>AH</given-names> </name></person-group><article-title>Large language models take on cardiothoracic surgery: a comparative analysis of the performance of four models on American Board of Thoracic Surgery Exam questions in 2023</article-title><source>Cureus</source><year>2024</year><month>07</month><volume>16</volume><issue>7</issue><fpage>e65083</fpage><pub-id pub-id-type="doi">10.7759/cureus.65083</pub-id><pub-id pub-id-type="medline">39171020</pub-id></nlm-citation></ref><ref id="ref72"><label>72</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Benary</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>XD</given-names> </name><name name-style="western"><surname>Schmidt</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Leveraging large language models for decision support in personalized oncology</article-title><source>JAMA Netw Open</source><year>2023</year><month>11</month><day>1</day><volume>6</volume><issue>11</issue><fpage>e2343689</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.43689</pub-id><pub-id pub-id-type="medline">37976064</pub-id></nlm-citation></ref><ref id="ref73"><label>73</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Ammann</surname><given-names>PJL</given-names> </name><name name-style="western"><surname>Golde</surname><given-names>J</given-names> </name><name name-style="western"><surname>Akbik</surname><given-names>A</given-names> </name></person-group><article-title>Question decomposition for retrieval-augmented generation</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 1, 2025</comment><pub-id pub-id-type="doi">10.48550/arXiv.2507.00355</pub-id></nlm-citation></ref><ref id="ref74"><label>74</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lammert</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dreyer</surname><given-names>T</given-names> </name><name name-style="western"><surname>Mathes</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Expert-guided large language models for clinical decision support in precision oncology</article-title><source>JCO Precis Oncol</source><year>2024</year><month>10</month><volume>8</volume><fpage>e2400478</fpage><pub-id pub-id-type="doi">10.1200/PO-24-00478</pub-id><pub-id pub-id-type="medline">39475661</pub-id></nlm-citation></ref><ref id="ref75"><label>75</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tozuka</surname><given-names>R</given-names> </name><name name-style="western"><surname>Johno</surname><given-names>H</given-names> </name><name name-style="western"><surname>Amakawa</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Application of NotebookLM, a large language model with retrieval-augmented generation, for lung cancer staging</article-title><source>Jpn J Radiol</source><year>2025</year><month>04</month><volume>43</volume><issue>4</issue><fpage>706</fpage><lpage>712</lpage><pub-id pub-id-type="doi">10.1007/s11604-024-01705-1</pub-id><pub-id pub-id-type="medline">39585559</pub-id></nlm-citation></ref><ref id="ref76"><label>76</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Giuffr&#x00E8;</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kresevic</surname><given-names>S</given-names> </name><name name-style="western"><surname>Pugliese</surname><given-names>N</given-names> </name><name name-style="western"><surname>You</surname><given-names>K</given-names> </name><name name-style="western"><surname>Shung</surname><given-names>DL</given-names> </name></person-group><article-title>Optimizing large language models in digestive disease: strategies and challenges to improve clinical outcomes</article-title><source>Liver Int</source><year>2024</year><month>09</month><volume>44</volume><issue>9</issue><fpage>2114</fpage><lpage>2124</lpage><pub-id pub-id-type="doi">10.1111/liv.15974</pub-id><pub-id pub-id-type="medline">38819632</pub-id></nlm-citation></ref><ref id="ref77"><label>77</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arzideh</surname><given-names>K</given-names> </name><name name-style="western"><surname>Sch&#x00E4;fer</surname><given-names>H</given-names> </name><name name-style="western"><surname>Allende-Cid</surname><given-names>H</given-names> </name><etal/></person-group><article-title>From BERT to generative AI - comparing encoder-only vs. large language models in a cohort of lung cancer patients for named entity recognition in unstructured medical reports</article-title><source>Comput Biol Med</source><year>2025</year><month>09</month><volume>195</volume><fpage>110665</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2025.110665</pub-id><pub-id pub-id-type="medline">40554973</pub-id></nlm-citation></ref><ref id="ref78"><label>78</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>H</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Large language model trained on clinical oncology data predicts cancer progression</article-title><source>NPJ Digit Med</source><year>2025</year><month>07</month><day>2</day><volume>8</volume><issue>1</issue><fpage>397</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01780-2</pub-id><pub-id pub-id-type="medline">40604229</pub-id></nlm-citation></ref><ref id="ref79"><label>79</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khalid</surname><given-names>N</given-names> </name><name name-style="western"><surname>Qayyum</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bilal</surname><given-names>M</given-names> </name><name name-style="western"><surname>Al-Fuqaha</surname><given-names>A</given-names> </name><name name-style="western"><surname>Qadir</surname><given-names>J</given-names> </name></person-group><article-title>Privacy-preserving artificial intelligence in healthcare: techniques and applications</article-title><source>Comput Biol Med</source><year>2023</year><month>05</month><volume>158</volume><fpage>106848</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2023.106848</pub-id><pub-id pub-id-type="medline">37044052</pub-id></nlm-citation></ref><ref id="ref80"><label>80</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Clunie</surname><given-names>D</given-names> </name><name name-style="western"><surname>Taylor</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bisson</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Summary of the National Cancer Institute 2023 virtual workshop on medical image de-identification&#x2014;part 2: pathology whole slide image de-identification, de-facing, the role of AI in image de-identification, and the NCI MIDI datasets and pipeline</article-title><source>J Digit Imaging Inform med</source><year>2025</year><month>02</month><volume>38</volume><issue>1</issue><fpage>16</fpage><lpage>30</lpage><pub-id pub-id-type="doi">10.1007/s10278-024-01183-x</pub-id></nlm-citation></ref><ref id="ref81"><label>81</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>S</given-names> </name><name name-style="western"><surname>Li</surname><given-names>GY</given-names> </name></person-group><article-title>Federated learning via inexact ADMM</article-title><source>IEEE Trans Pattern Anal Mach Intell</source><year>2023</year><month>08</month><volume>45</volume><issue>8</issue><fpage>9699</fpage><lpage>9708</lpage><pub-id pub-id-type="doi">10.1109/TPAMI.2023.3243080</pub-id><pub-id pub-id-type="medline">37022837</pub-id></nlm-citation></ref><ref id="ref82"><label>82</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>P</given-names> </name><name name-style="western"><surname>Nascimento</surname><given-names>GG</given-names> </name><etal/></person-group><article-title>Federated and distributed learning applications for electronic health records and structured medical data: a scoping review</article-title><source>J Am Med Inform Assoc</source><year>2023</year><month>11</month><day>17</day><volume>30</volume><issue>12</issue><fpage>2041</fpage><lpage>2049</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocad170</pub-id><pub-id pub-id-type="medline">37639629</pub-id></nlm-citation></ref><ref id="ref83"><label>83</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shiri</surname><given-names>I</given-names> </name><name name-style="western"><surname>Salimi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Maghsudi</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Differential privacy preserved federated transfer learning for multi-institutional <sup>68</sup>Ga-PET image artefact detection and disentanglement</article-title><source>Eur J Nucl Med Mol Imaging</source><year>2023</year><month>12</month><volume>51</volume><issue>1</issue><fpage>40</fpage><lpage>53</lpage><pub-id pub-id-type="doi">10.1007/s00259-023-06418-7</pub-id><pub-id pub-id-type="medline">37682303</pub-id></nlm-citation></ref><ref id="ref84"><label>84</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haltaufderheide</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ranisch</surname><given-names>R</given-names> </name></person-group><article-title>The ethics of ChatGPT in medicine and healthcare: a systematic review on large language models (LLMs)</article-title><source>NPJ Digit Med</source><year>2024</year><month>07</month><day>8</day><volume>7</volume><issue>1</issue><fpage>183</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01157-x</pub-id><pub-id pub-id-type="medline">38977771</pub-id></nlm-citation></ref><ref id="ref85"><label>85</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>CK</given-names> </name><name name-style="western"><surname>Ke</surname><given-names>CR</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>MS</given-names> </name><etal/></person-group><article-title>Using large language models for efficient cancer registry coding in the real hospital setting: a feasibility study</article-title><source>Pac Symp Biocomput</source><year>2025</year><volume>30</volume><fpage>121</fpage><lpage>137</lpage><pub-id pub-id-type="doi">10.1142/9789819807024_0010</pub-id><pub-id pub-id-type="medline">39670366</pub-id></nlm-citation></ref><ref id="ref86"><label>86</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moore</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Socrates</surname><given-names>V</given-names> </name><name name-style="western"><surname>Hesami</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Using natural language processing to identify emergency department patients with incidental lung nodules requiring follow-up</article-title><source>Acad Emerg Med</source><year>2025</year><month>03</month><volume>32</volume><issue>3</issue><fpage>274</fpage><lpage>283</lpage><pub-id pub-id-type="doi">10.1111/acem.15080</pub-id><pub-id pub-id-type="medline">39821298</pub-id></nlm-citation></ref><ref id="ref87"><label>87</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Geevarghese</surname><given-names>R</given-names> </name><name name-style="western"><surname>Solomon</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Alexander</surname><given-names>ES</given-names> </name><etal/></person-group><article-title>Utility of a large language model for extraction of clinical findings from healthcare data following lung ablation: a feasibility study</article-title><source>J Vasc Interv Radiol</source><year>2025</year><month>04</month><volume>36</volume><issue>4</issue><fpage>704</fpage><lpage>708</lpage><pub-id pub-id-type="doi">10.1016/j.jvir.2024.11.029</pub-id><pub-id pub-id-type="medline">39662619</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Specific quality evaluation items and results.</p><media xlink:href="jmir_v27i1e74177_app1.docx" xlink:title="DOCX File, 47 KB"/></supplementary-material><supplementary-material id="app2"><label>Checklist 1</label><p>PRISMA checklist.</p><media xlink:href="jmir_v27i1e74177_app2.docx" xlink:title="DOCX File, 272 KB"/></supplementary-material></app-group></back></article>