<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="review-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v28i1e77593</article-id><article-id pub-id-type="doi">10.2196/77593</article-id><article-categories><subj-group subj-group-type="heading"><subject>Review</subject></subj-group></article-categories><title-group><article-title>Accuracy of Deep Learning for Detecting Axillary Lymph Node Metastasis in Breast Cancer: Systematic Review and Meta-Analysis</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Wang</surname><given-names>Xueying</given-names></name><degrees>MMed</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Li</surname><given-names>Tiantian</given-names></name><degrees>MMed</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wang</surname><given-names>Xiaohang</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Fu</surname><given-names>Deyuan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Breast Surgery, Northern Jiangsu People's Hospital Affiliated to Yangzhou University</institution><addr-line>No.98 Nantong West Road, Guangling District</addr-line><addr-line>Yangzhou</addr-line><country>China</country></aff><aff id="aff2"><institution>Department of Ultrasonography, Northern Jiangsu People's Hospital Affiliated to Yangzhou University</institution><addr-line>Yangzhou</addr-line><country>China</country></aff><aff id="aff3"><institution>Institute of Translational Medicine, Jiangsu Key Laboratory of Integrated Traditional Chinese and Western Medicine for Prevention and Treatment of Senile Diseases, Medical College, Yangzhou University</institution><addr-line>Yangzhou</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Coristine</surname><given-names>Andrew</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Ahmadzadeh</surname><given-names>Amir Mahmoud</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Beltr&#x00E3;o</surname><given-names>Monique</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Deyuan Fu, PhD, Department of Breast Surgery, Northern Jiangsu People's Hospital Affiliated to Yangzhou University, No.98 Nantong West Road, Guangling District, Yangzhou, 225001, China, 86 18051060677; <email>18051060677@yzu.edu.cn</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>16</day><month>4</month><year>2026</year></pub-date><volume>28</volume><elocation-id>e77593</elocation-id><history><date date-type="received"><day>16</day><month>05</month><year>2025</year></date><date date-type="rev-recd"><day>27</day><month>02</month><year>2026</year></date><date date-type="accepted"><day>27</day><month>02</month><year>2026</year></date></history><copyright-statement>&#x00A9; Xueying Wang, Tiantian Li, Xiaohang Wang, Deyuan Fu. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 16.4.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2026/1/e77593"/><abstract><sec><title>Background</title><p>Axillary lymph node metastasis (ALNM) is an important factor in detecting breast cancer (BC). However, the noninvasive diagnosis of ALNM remains challenging. While some deep learning (DL) models have been developed for preoperative ALNM assessment, their performance lacks systematic evaluation.</p></sec><sec><title>Objective</title><p>This study aims to evaluate the effectiveness of DL in detecting ALNM, providing evidence to support clinical diagnostic tools.</p></sec><sec sec-type="methods"><title>Methods</title><p>Embase, Web of Science, PubMed, and Cochrane Library were searched from their inception through January 26, 2026. The Quality Assessment of Diagnostic Accuracy Studies was used to assess the risk of bias in the included studies. A bivariate mixed effects model was applied for analysis, and subgroup analyses were conducted based on different imaging modalities.</p></sec><sec sec-type="results"><title>Results</title><p>This meta-analysis included 28 independent studies and pooled data from 20,811 patients with BC. Among them, 7123 cases had confirmed ALNM. The overall diagnostic performance of the DL model (bivariate mixed effects) for detecting ALNM in BC was as follows: sensitivity 0.80 (95% CI 0.76&#x2010;0.84), specificity 0.85 (95% CI 0.80&#x2010;0.88), diagnostic odds ratio (DOR) 22 (95% CI 16&#x2010;30), and area under the summary receiver operating characteristic curve (AUC) 0.89 (95% CI 0.86&#x2010;0.92). The positive likelihood ratio (LR+) was 5.2 (95% CI 4.1&#x2010;6.5), and the negative likelihood ratio (LR&#x2212;) was 0.24 (95% CI 0.19&#x2010;0.29). For ultrasound-based DL models targeting ALNM detection, the pooled sensitivity and specificity were 0.79 (95% CI 0.72&#x2010;0.84) and 0.86 (95% CI 0.79&#x2010;0.91), respectively. Diagnostic performance metrics showed an LR+ of 5.5 (95% CI 3.8&#x2010;8.1), an LR&#x2212; of 0.25 (95% CI 0.19&#x2010;0.32), a DOR of 22 (95% CI 15&#x2010;33), and an AUC of 0.89 (95% CI 0.86&#x2010;0.91). Regarding magnetic resonance imaging&#x2013;based DL models for detecting ALNM, the pooled sensitivity was 0.78 (95% CI 0.71&#x2010;0.83) and the pooled specificity was 0.82 (95% CI 0.76&#x2010;0.87). Corresponding metrics included an LR+ of 4.4 (95% CI 3.3&#x2010;5.9), an LR&#x2212; of 0.27 (95% CI 0.21&#x2010;0.35), a DOR of 16 (95% CI 11&#x2010;25), and an AUC of 0.87 (95% CI 0.84&#x2010;0.90). For computed tomography (CT)&#x2013;based models, the sensitivity was 0.90 (95% CI 0.78&#x2010;0.96), the specificity was 0.88 (95% CI 0.84&#x2010;0.92), and the AUC was as high as 0.91 (95% CI 0.89&#x2010;0.94).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Current DL methods for detecting ALNM in BC primarily utilize ultrasound, magnetic resonance imaging, and CT. DL models based on all 3 modalities demonstrated good diagnostic performance. CT had the highest sensitivity and AUC, while its specificity was comparable to that of ultrasound. These findings provide supportive evidence for the development or optimization of clinical diagnostic models.</p></sec><sec><title>Trial Registration</title><p>PROSPERO CRD42024609828; https://www.crd.york.ac.uk/PROSPERO/view/CRD42024609828</p></sec></abstract><kwd-group><kwd>breast cancer</kwd><kwd>axillary lymph node metastasis</kwd><kwd>deep learning</kwd><kwd>systematic review</kwd><kwd>ultrasound</kwd><kwd>magnetic resonance imaging</kwd><kwd>computed tomography</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Breast cancer (BC) is a common and life-threatening tumor in women. According to the latest global statistics of 2025, there were 2.3 million new BC cases (accounting for 25% of all new cancer cases among women) and 670,000 BC-related deaths (accounting for 15.5% of cancer deaths in women) worldwide in 2022. By 2050, new cases of BC are projected to rise by 38%, while BC deaths are expected to increase by 68%, with the fastest growth observed in low- and middle-income countries [<xref ref-type="bibr" rid="ref1">1</xref>]. The incidence of BC varies notably by region. New Zealand and Australia have the highest incidence of BC, with an age-standardized incidence rate of 100.3 per 100,000, while South Asia has the lowest rate at 26.7 per 100,000 [<xref ref-type="bibr" rid="ref1">1</xref>]. Moreover, the incidence of BC is rising at approximately 0.6% per year and is trending toward a younger age at onset [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Consequently, BC has emerged as a severe disease burden on society. BC treatment includes local and systemic therapies, with surgery, radiotherapy, and chemotherapy as the primary therapeutic approaches. Currently, immunotherapy [<xref ref-type="bibr" rid="ref4">4</xref>], brachytherapy [<xref ref-type="bibr" rid="ref5">5</xref>], and neoadjuvant therapy [<xref ref-type="bibr" rid="ref6">6</xref>] have significantly improved the clinical outcomes and prolonged the survival of patients with BC. However, some patients still experience poor prognoses due to influencing factors, such as axillary lymph node metastasis (ALNM), molecular subtypes, and lymphovascular invasion. As ALNM can elevate the risk of recurrence and metastasis of BC, it is an important factor for assessing the treatment and prognosis of BC [<xref ref-type="bibr" rid="ref7">7</xref>]. Currently, the accurate detection of ALNM before BC surgery remains challenging. Although techniques including fine-needle aspiration cytology and core needle biopsy can be used in clinical practice, these invasive procedures may lead to complications such as implantation metastasis and hematoma. Moreover, these procedures may cause false negatives, thereby affecting diagnostic accuracy and timely treatment. Thus, developing a preoperative, efficient, accurate, and safe method for detecting ALNM is of great clinical significance for improving the diagnostic and prognostic evaluation of patients with BC. Furthermore, it serves as a critical research topic that requires in-depth exploration.</p><p>With advances in machine learning (ML), many researchers have applied ML approaches to oncology. ML can integrate high-dimensional data, including clinical features, gene expression, and imaging characteristics, to construct models for diagnosing disease, assessing progression, and evaluating prognosis [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Traditional ML depends on manual coding and requires variable selection, image segmentation, and extraction of image features using specialized software (eg, 3D Slicer [Slicer Community] and ITK-SNAP [Penn Image Computing and Science Laboratory]). The features are then imported into ML for filtering, modeling, and validation. However, information may be lost during the extraction and screening process. Although deep learning (DL) can automatically train on images, it still relies on manual segmentation for model construction in current research. DL can directly train models based on segmented images. Therefore, this technique preserves maximal information, enhancing the diagnostic accuracy [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Accordingly, some researchers have developed image-based DL models [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>] to improve the preoperative diagnosis of ALNM. Nonetheless, systematic evidence on the accuracy of DL for detecting ALNM remains limited. Therefore, this study aims to evaluate the performance of current image-based DL models for detecting ALNM in BC and provide evidence-based insights for developing or updating intelligent diagnostic tools for clinical practice.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Registration</title><p>This study was performed in accordance with the PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) 2020 guidelines (<xref ref-type="supplementary-material" rid="app2">Checklist 1</xref>) and was registered in the PROSPERO (Prospective Register of Systematic Reviews) database (ID CRD42024609828).</p></sec><sec id="s2-2"><title>Eligibility Criteria</title><p>The eligibility criteria were established as the basis for subsequent literature screening as shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Eligibility criteria for study inclusion in the systematic review and meta-analysis of DL<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> models for detecting ALNM<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> status in patients with BC<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup>.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">PICOS</td><td align="left" valign="bottom">Inclusion criteria</td><td align="left" valign="bottom">Exclusion criteria</td></tr></thead><tbody><tr><td align="left" valign="top">Participants (P)</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Studies involving patients with BC</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Studies that did not strictly differentiate BC from other tumors</p></list-item></list></td></tr><tr><td align="left" valign="top">Intervention (I)</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Studies that developed DL models for ALNM detection</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Studies that only applied traditional ML<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></p></list-item><list-item><p>Studies that only performed image segmentation without constructing a DL model</p></list-item></list></td></tr><tr><td align="left" valign="top">Comparison (C)</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>None</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>None</p></list-item></list></td></tr><tr><td align="left" valign="top">Outcomes (O)</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Studies that reported metrics for evaluating ML model performance (eg, sensitivity, specificity, area under the summary receiver operating characteristic curve, negative likelihood ratio, positive likelihood ratio, and diagnostic odds ratio)</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Studies that did not report the aforementioned performance metrics</p></list-item></list></td></tr><tr><td align="left" valign="top">Study design (S)</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Case-control, cohort, or cross-sectional studies</p></list-item><list-item><p>Studies published in English</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Conference abstracts, guidelines, meta-analyses, reviews, or expert opinions</p></list-item><list-item><p>Lymph node status not confirmed by biopsy</p></list-item><list-item><p>No clear differentiation between the sentinel and axillary lymph nodes</p></list-item></list></td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>DL: deep learning.</p></fn><fn id="table1fn2"><p><sup>b</sup>ALNM: axillary lymph node metastasis.</p></fn><fn id="table1fn3"><p><sup>c</sup>BC: breast cancer.</p></fn><fn id="table1fn4"><p><sup>d</sup>ML: machine learning.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-3"><title>Data Sources and Search Strategy</title><p>Web of Science, Cochrane Library, PubMed, and Embase were searched from their inception up to January 26, 2026. The search strategy was designed by combining free-text terms and subject headings. There were no temporal or geographical restrictions. The search strategy is illustrated in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-4"><title>Study Selection and Data Extraction</title><p>Initially retrieved studies were imported into EndNote. After removing duplicates, the titles and abstracts of the remaining studies were further reviewed. After a full-text review, eligible studies were selected. Data extraction was performed using a standardized form. The extracted information included digital object identifier, publication year, patient source, country, title, study design, first author, number of ALNM cases, total cases, number of ALNM cases within the training cohort, total cases within the training cohort, number of ALNM cases within the validation cohort, total cases within the validation cohort, methods used to generate the validation cohort, whether region of interest segmentation was performed, model type, and whether a clinical comparison was conducted. Two reviewers independently selected the studies and extracted the data. Disagreements were resolved through consultation with a third reviewer.</p></sec><sec id="s2-5"><title>Risk of Bias in Included Studies</title><p>The risk of bias (RoB) of the included studies was assessed using the Quality Assessment of Diagnostic Accuracy Studies [<xref ref-type="bibr" rid="ref17">17</xref>]. This tool assessed overall bias and clinical applicability in 4 domains: index test, flow and timing, reference standard, and patient selection. Each domain was rated as low, high, or unclear RoB according to specific criteria. Two reviewers independently assessed the RoB and cross-checked the evaluation results. Disagreements were resolved through consultation with a third reviewer.</p></sec><sec id="s2-6"><title>Synthesis Methods</title><p>Data analysis was performed using Stata 15.0 (StataCorp LLC). A bivariate mixed effects (BME) model was used to explore the nonlinear relationship between sensitivity and specificity. The model estimated the following along with their corresponding 95% CIs: pooled sensitivity, specificity, area under the summary receiver operating characteristic curve (AUC), negative likelihood ratio (LR&#x2212;), positive likelihood ratio (LR+), and diagnostic odds ratio (DOR). Publication bias was evaluated using the Deeks funnel plot. Sensitivity and specificity were derived from a 2&#x00D7;2 contingency table. Since most studies did not report contingency tables, the pooled sensitivity, specificity, precision, and case numbers were used for calculations. In the validation phase, a meta-analysis was conducted. When multiple validation sets were available within a single investigation, all were incorporated into the analysis. Subgroup analyses were performed, stratified by image type and validation set generation method. Furthermore, the analysis aggregated the outcomes from both internal and external validations for DL models developed using ultrasound, magnetic resonance imaging (MRI), and computed tomography (CT). Moreover, for studies with multiple validation cohorts, only the cohort with the highest Youden index was retained to ensure that a single validation cohort was retained in each study for the sensitivity analysis. The meta-analysis was then repeated with this reduced dataset. A <italic>P</italic> value &#x003C;.05 was considered statistically significant.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Selection</title><p>A total of 2225 studies were selected from the databases, among which 521 duplicates were removed. Following a title and abstract screening, 1659 studies were further excluded. The full texts of the remaining 45 studies were assessed, and 17 studies were removed for the following reasons: inaccessible conference abstracts (n=4), absence of outcome indicators for assessing the accuracy of DL (n=6), sole focus on image segmentation (n=2), use of positron emission tomography-CT as the diagnostic gold standard (n=1), and lack of clear differentiation between sentinel and axillary lymph nodes (n=4). Ultimately, 28 studies [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref43">43</xref>] were included in the analysis. The study screening process is illustrated in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flow diagram illustrating the identification and selection process of studies evaluating DL models for the preoperative diagnosis of ALNM in BC. Data sources: Web of Science, Cochrane Library, PubMed, and Embase (search date: January 26, 2026). ALNM: axillary lymph node metastasis; BC: breast cancer; PET-CT: positron emission tomography-computed tomography.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77593_fig01.png"/></fig></sec><sec id="s3-2"><title>Study Characteristics</title><p>A total of 28 studies published between 2018 and 2026 were included. These studies involved 20,811 patients with BC, 7123 of whom had ALNM. Twenty-three of the studies were from China, 3 from the United States, 1 from Italy, and 1 from Korea. All of the studies used a case-control design. Seventeen of the studies were single-center, and 11 were multicenter. Regarding imaging modalities, 10 studies utilized MRI, 14 used ultrasound images, and 4 used CT scans. All 28 studies clearly described their validation methods. Twenty studies employed random sampling, 10 used external validation, and 3 utilized cross-validation. Twenty-three studies conducted manual segmentation, and 7 reported the comparisons between DL models and clinical physicians (<xref ref-type="table" rid="table2">Table 2</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Characteristics of the 28 included studies on DL<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> for ALNM<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> in patients with BC<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup> published between 2018 and 2026<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">No.</td><td align="left" valign="bottom">Included study and year of publication</td><td align="left" valign="bottom">Country of the author</td><td align="left" valign="bottom">Study type</td><td align="left" valign="bottom">Patient source</td><td align="left" valign="bottom">Modality</td><td align="left" valign="bottom">Number of lymph node metastasis cases</td><td align="left" valign="bottom">Total number of cases</td><td align="left" valign="bottom">Total number of cases in the training set</td><td align="left" valign="bottom">Generation method of the validation set</td><td align="left" valign="bottom">Number of cases in the validation set</td><td align="left" valign="bottom">Whether region of interest segmentation is used or not</td><td align="left" valign="bottom">Segmentation method</td><td align="left" valign="bottom">Network architecture</td><td align="left" valign="bottom">Network input</td><td align="left" valign="bottom">Comparison with clinicians</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">Gong et al [<xref ref-type="bibr" rid="ref18">18</xref>] (2025)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td><td align="left" valign="top">312</td><td align="left" valign="top">1280</td><td align="left" valign="top">921</td><td align="left" valign="top">Random sampling, temporal validation</td><td align="left" valign="top">I1<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup>: 102; I2: 257</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">Transformer</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">Agyekum et al [<xref ref-type="bibr" rid="ref19">19</xref>] (2025)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">US</td><td align="left" valign="top">295</td><td align="left" valign="top">820</td><td align="left" valign="top">621</td><td align="left" valign="top">External validation</td><td align="left" valign="top">E1<sup><xref ref-type="table-fn" rid="table2fn7">g</xref></sup>: 112;<break/>E2: 87</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet50<sup><xref ref-type="table-fn" rid="table2fn8">h</xref></sup> and GCN<sup><xref ref-type="table-fn" rid="table2fn9">i</xref></sup></td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref20">20</xref>] (2025)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">US</td><td align="left" valign="top">1013</td><td align="left" valign="top">1557</td><td align="left" valign="top">1144</td><td align="left" valign="top">Random sampling, external validation</td><td align="left" valign="top">I: 273;<break/>E: 140</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">Transformer</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">Gu et al [<xref ref-type="bibr" rid="ref21">21</xref>] (2025)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">MRI<sup><xref ref-type="table-fn" rid="table2fn10">j</xref></sup></td><td align="left" valign="top">201</td><td align="left" valign="top">520</td><td align="left" valign="top">287</td><td align="left" valign="top">Random sampling, external validation</td><td align="left" valign="top">I: 124;<break/>E: 109</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Semiautomatic</td><td align="left" valign="top">Convolutional neural network (CNN)</td><td align="left" valign="top">3D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">Dai et al [<xref ref-type="bibr" rid="ref22">22</xref>] (2025)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">MRI</td><td align="left" valign="top">386</td><td align="left" valign="top">935</td><td align="left" valign="top">742</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">I: 83;<break/>E: 110</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">3D ResNet, 3D-Xception, and HRNet<sup><xref ref-type="table-fn" rid="table2fn11">k</xref></sup></td><td align="left" valign="top">2D</td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">6</td><td align="left" valign="top">Sun et al [<xref ref-type="bibr" rid="ref23">23</xref>] (2025)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">CT<sup><xref ref-type="table-fn" rid="table2fn12">l</xref></sup></td><td align="left" valign="top">91</td><td align="left" valign="top">258</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">Not reported</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet101</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">7</td><td align="left" valign="top">Wang et al [<xref ref-type="bibr" rid="ref24">24</xref>] (2024)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US</td><td align="left" valign="top">67</td><td align="left" valign="top">266</td><td align="left" valign="top">212</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">I: 27;<break/>T: 27(3)</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Automatic</td><td align="left" valign="top">DeepLabV3+, ResNet-101, and CNN</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">8</td><td align="left" valign="top">Polat et al [<xref ref-type="bibr" rid="ref25">25</xref>] (2024)</td><td align="left" valign="top">America</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">MRI</td><td align="left" valign="top">152</td><td align="left" valign="top">253</td><td align="left" valign="top">All cases</td><td align="left" valign="top">Cross-validation (2)</td><td align="left" valign="top">All cases</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">CNN</td><td align="left" valign="top">3D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">9</td><td align="left" valign="top">Zhou et al [<xref ref-type="bibr" rid="ref26">26</xref>] (2024)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">MRI</td><td align="left" valign="top">530</td><td align="left" valign="top">1259</td><td align="left" valign="top">801</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">I: 344;<break/>E: 114</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet101, ResNeXt101, and DenseNet<sup><xref ref-type="table-fn" rid="table2fn13">m</xref></sup></td><td align="left" valign="top">2D</td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">10</td><td align="left" valign="top">Park et al [<xref ref-type="bibr" rid="ref14">14</xref>] (2024)</td><td align="left" valign="top">Korea</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">CT</td><td align="left" valign="top">303</td><td align="left" valign="top">523</td><td align="left" valign="top">417</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">I1: 53; I2: 53</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">DenseNet 121</td><td align="left" valign="top">2D axial CT slice</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">11</td><td align="left" valign="top">Liu et al [<xref ref-type="bibr" rid="ref27">27</xref>] (2024)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">US</td><td align="left" valign="top">327</td><td align="left" valign="top">883</td><td align="left" valign="top">621</td><td align="left" valign="top">External validation</td><td align="left" valign="top">E1: 112;<break/>E2: 87;<break/>E3: 63</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet50</td><td align="left" valign="top">2D US image</td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">12</td><td align="left" valign="top">Guo et al [<xref ref-type="bibr" rid="ref28">28</xref>] (2024)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">MRI</td><td align="left" valign="top">1064</td><td align="left" valign="top">2063</td><td align="left" valign="top">1256</td><td align="left" valign="top">Random sampling, external validation</td><td align="left" valign="top">I: 539;<break/>E1: 153;<break/>E2: 115</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">Convolutional recurrent neural network</td><td align="left" valign="top">2D image</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">13</td><td align="left" valign="top">Wei et al [<xref ref-type="bibr" rid="ref29">29</xref>] (2023)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US</td><td align="left" valign="top">349</td><td align="left" valign="top">892</td><td align="left" valign="top">535</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">I1: 178;<break/>I2: 179</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">Inception_v3, ResNet101, ResNet50, VGG19<sup><xref ref-type="table-fn" rid="table2fn14">n</xref></sup>, and<break/>Wide_resnet50_v2</td><td align="left" valign="top">2D grayscale image</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">14</td><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref16">16</xref>] (2023)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">US</td><td align="left" valign="top">127</td><td align="left" valign="top">320</td><td align="left" valign="top">210</td><td align="left" valign="top">External validation</td><td align="left" valign="top">I: 61;<break/>E: 49</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Automatic</td><td align="left" valign="top">CNN (R2+1D, TIN<sup><xref ref-type="table-fn" rid="table2fn15">o</xref></sup>, ResNet-3D)</td><td align="left" valign="top">Video sequence (3D)</td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">15</td><td align="left" valign="top">Gao et al [<xref ref-type="bibr" rid="ref30">30</xref>] (2023)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">MRI</td><td align="left" valign="top">387</td><td align="left" valign="top">941</td><td align="left" valign="top">742</td><td align="left" valign="top">Random sampling, external validation</td><td align="left" valign="top">I: 83;<break/>E: 116</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">3D ResNet + CBAM<sup><xref ref-type="table-fn" rid="table2fn16">p</xref></sup></td><td align="left" valign="top">3D DCE<sup><xref ref-type="table-fn" rid="table2fn17">q</xref></sup>-MRI volume data</td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">16</td><td align="left" valign="top">Zhang et al [<xref ref-type="bibr" rid="ref31">31</xref>] (2022)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">MRI</td><td align="left" valign="top">98</td><td align="left" valign="top">252</td><td align="left" valign="top">202</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">50</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet50</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">17</td><td align="left" valign="top">Zhang et al [<xref ref-type="bibr" rid="ref32">32</xref>] (2022)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US</td><td align="left" valign="top">394</td><td align="left" valign="top">952</td><td align="left" valign="top">902</td><td align="left" valign="top">External validation</td><td align="left" valign="top">50</td><td align="left" valign="top">No</td><td align="left" valign="top">None</td><td align="left" valign="top">CNN</td><td align="left" valign="top">2D</td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">18</td><td align="left" valign="top">Wang et al [<xref ref-type="bibr" rid="ref33">33</xref>] (2022)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">MRI</td><td align="left" valign="top">163</td><td align="left" valign="top">348</td><td align="left" valign="top">315</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">33</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet50</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">19</td><td align="left" valign="top">Sun et al [<xref ref-type="bibr" rid="ref34">34</xref>] (2022)</td><td align="left" valign="top">America</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US</td><td align="left" valign="top">64</td><td align="left" valign="top">169</td><td align="left" valign="top">All cases</td><td align="left" valign="top">Cross-validation</td><td align="left" valign="top">All cases</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">Custom CNN and ResNet-101</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">20</td><td align="left" valign="top">Santucci et al [<xref ref-type="bibr" rid="ref35">35</xref>] (2022)</td><td align="left" valign="top">Italy</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">MRI</td><td align="left" valign="top">27</td><td align="left" valign="top">128</td><td align="left" valign="top">All cases</td><td align="left" valign="top">Cross-validation</td><td align="left" valign="top">All cases</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">SFB-NET<sup><xref ref-type="table-fn" rid="table2fn18">r</xref></sup>, VB-NET<sup><xref ref-type="table-fn" rid="table2fn19">s</xref></sup>, 2DS-NET<sup><xref ref-type="table-fn" rid="table2fn20">t</xref></sup> (optimal)</td><td align="left" valign="top">2D slice and 3D volume</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">21</td><td align="left" valign="top">Li et al [<xref ref-type="bibr" rid="ref36">36</xref>] (2022)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US</td><td align="left" valign="top">489</td><td align="left" valign="top">2131</td><td align="left" valign="top">1491</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">640</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet-50</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">22</td><td align="left" valign="top">Cattell et al [<xref ref-type="bibr" rid="ref37">37</xref>] (2022)</td><td align="left" valign="top">America</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">MRI</td><td align="left" valign="top">67</td><td align="left" valign="top">198</td><td align="left" valign="top">109</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">I1: 54;<break/>I2: 35</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">VGG16</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">23</td><td align="left" valign="top">Zeng et al [<xref ref-type="bibr" rid="ref38">38</xref>] (2021)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">CT</td><td align="left" valign="top">100</td><td align="left" valign="top">229</td><td align="left" valign="top">153</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">76</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">Custom CNN (decoupling convolution)</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">24</td><td align="left" valign="top">Liu et al [<xref ref-type="bibr" rid="ref39">39</xref>] (2021)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">CT</td><td align="left" valign="top">400</td><td align="left" valign="top">800</td><td align="left" valign="top">480</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">I1: 160;<break/>I2:160</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">DA-VGG19</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">25</td><td align="left" valign="top">Zhou et al [<xref ref-type="bibr" rid="ref40">40</xref>] (2020)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">US</td><td align="left" valign="top">420</td><td align="left" valign="top">834</td><td align="left" valign="top">680</td><td align="left" valign="top">Random sampling, external validation</td><td align="left" valign="top">I: 76;<break/>E: 78</td><td align="left" valign="top">No</td><td align="left" valign="top">None</td><td align="left" valign="top">Inception V3, Inception-ResNet V2, and ResNet-101</td><td align="left" valign="top">2D</td><td align="left" valign="top">Yes</td></tr><tr><td align="left" valign="top">26</td><td align="left" valign="top">Zheng et al [<xref ref-type="bibr" rid="ref41">41</xref>] (2020)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US</td><td align="left" valign="top">247</td><td align="left" valign="top">584</td><td align="left" valign="top">466</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">118</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">ResNet-50</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">27</td><td align="left" valign="top">Sun et al [<xref ref-type="bibr" rid="ref42">42</xref>] (2020)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Single center</td><td align="left" valign="top">US</td><td align="left" valign="top">136</td><td align="left" valign="top">479</td><td align="left" valign="top">359</td><td align="left" valign="top">Random sampling</td><td align="left" valign="top">120</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">DenseNet-121</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr><tr><td align="left" valign="top">28</td><td align="left" valign="top">Guo et al [<xref ref-type="bibr" rid="ref43">43</xref>] (2020)</td><td align="left" valign="top">China</td><td align="left" valign="top">Case-control</td><td align="left" valign="top">Multicenter</td><td align="left" valign="top">US</td><td align="left" valign="top">365</td><td align="left" valign="top">937</td><td align="left" valign="top">542</td><td align="left" valign="top">External validation</td><td align="left" valign="top">395</td><td align="left" valign="top">Yes</td><td align="left" valign="top">Manual</td><td align="left" valign="top">Custom CNN</td><td align="left" valign="top">2D</td><td align="left" valign="top">No</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>DL: deep learning.</p></fn><fn id="table2fn2"><p><sup>b</sup>ALNM: axillary lymph node metastasis.</p></fn><fn id="table2fn3"><p><sup>c</sup>BC: breast cancer.</p></fn><fn id="table2fn4"><p><sup>d</sup>The table details study design, patient source, imaging modality, and validation methods. The 8th, 19th, and 20th studies in the table employed cross-validation methodologies. In the 3 studies, all cases were used in both the training and validation sets, and the training and validation sets were not independently partitioned. The construction of 2&#x00D7;2 contingency tables was not possible due to missing data, and some study cohorts were not included in the statistical analysis.</p></fn><fn id="table2fn5"><p><sup>e</sup>US: ultrasound.</p></fn><fn id="table2fn6"><p><sup>f</sup>I: internal validation cohort.</p></fn><fn id="table2fn7"><p><sup>g</sup>E: external validation cohort.</p></fn><fn id="table2fn8"><p><sup>h</sup>ResNet50: Residual Network 50.</p></fn><fn id="table2fn9"><p><sup>i</sup>GCN: graph convolutional network.</p></fn><fn id="table2fn10"><p><sup>j</sup>MRI: magnetic resonance imaging.</p></fn><fn id="table2fn11"><p><sup>k</sup>HRNet: high-resolution network.</p></fn><fn id="table2fn12"><p><sup>l</sup>CT: computed tomography.</p></fn><fn id="table2fn13"><p><sup>m</sup>DenseNet: densely connected convolutional network.</p></fn><fn id="table2fn14"><p><sup>n</sup>VGG: Visual Geometry Group.</p></fn><fn id="table2fn15"><p><sup>o</sup>TIN: temporal interlacing network.</p></fn><fn id="table2fn16"><p><sup>p</sup>CBAM: convolutional block attention module.</p></fn><fn id="table2fn17"><p><sup>q</sup>DCE: dynamic contrast-enhanced.</p></fn><fn id="table2fn18"><p><sup>r</sup>SFB-NET: single fixed-size box network.</p></fn><fn id="table2fn19"><p><sup>s</sup>VB-NET: variable-size box network.</p></fn><fn id="table2fn20"><p><sup>t</sup>2DS-NET: 2-dimensional slice network.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>RoB in Included Studies</title><sec id="s3-3-1"><title>Risk of Selection Bias and Outcome Assessment</title><p>All studies adopted consecutive sampling and applied image-based DL. Although these studies followed a case-control design, there was no bias in evaluating the performance of image-based DL. Therefore, the risk of selection bias was considered low as the case exclusions were reasonable. None of the studies described how the gold standard was interpreted. However, since this meta-analysis focused on artificial intelligence (AI)&#x2013;based DL, the interpretation of the reference standard had minimal impact on the role of DL in assessing positive events. Thus, the RoB in outcome assessment was considered low. The time interval between the reference standard and the index test was appropriate in all 28 studies, each of which used a single, consistent gold standard. Regarding patient flow, all studies were rated as having a low RoB.</p></sec><sec id="s3-3-2"><title>Concerns Regarding Applicability (High RoB)</title><p>However, 3 studies were rated as having a high RoB in the assessment of clinical applicability because they relied solely on cross-validation.</p></sec><sec id="s3-3-3"><title>Summary of Assessments</title><p>The RoB assessments are illustrated in <xref ref-type="fig" rid="figure2">Figures 2</xref> and <xref ref-type="fig" rid="figure3">3</xref>.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Summary of RoB, as assessed via the QUADAS-2 tool, for the 28 included case-control studies (2018&#x2010;2026) that evaluated the image-based DL models in detecting ALNM among patients with BC. The assessment across the 4 domains (patient selection, index test, reference standard, and flow and timing) indicates an overall low RoB. ALNM: axillary lymph node metastasis; BC: breast cancer; DL: deep learning; RoB: risk of bias; QUADAS: Quality Assessment of Diagnostic Accuracy Studies.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77593_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Overall low concerns regarding applicability identified by QUADAS-2 assessment of DL studies for ALNM diagnosis [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref43">43</xref>]. Among the 28 studies evaluated, 3 studies that used only cross-validation raised concerns due to their limited generalizability to broader clinical practice. ALNM: axillary lymph node metastasis; DL: deep learning; QUADAS: Quality Assessment of Diagnostic Accuracy Studies.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77593_fig03.png"/></fig></sec><sec id="s3-3-4"><title>Overall Model</title><p>Across all included studies, a total of 40 2&#x00D7;2 contingency tables from validation cohorts were utilized to evaluate the accuracy of DL in detecting ALNM, with an ALNM prevalence of 40.1%. The pooled results from the BME model were as follows: a sensitivity of 0.80 (95% CI 0.76&#x2010;0.84), a specificity of 0.85 (95% CI 0.80&#x2010;0.88), an LR+ of 5.2 (95% CI 4.1&#x2010;6.5), an LR&#x2212; of 0.24 (95% CI 0.19&#x2010;0.29), a DOR of 22 (95% CI 16&#x2010;30), and the AUC of 0.89 (95% CI 0.86&#x2010;0.92) (<xref ref-type="fig" rid="figure4">Figures 4</xref> and <xref ref-type="fig" rid="figure5">5</xref>). The Deeks funnel plot revealed no significant publication bias among the studies (<italic>P</italic>=.11) (<xref ref-type="fig" rid="figure6">Figure 6</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a true positive (TP) probability of 0.78 (<xref ref-type="fig" rid="figure7">Figure 7</xref>).</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Forest plots showing the pooled sensitivity and specificity of DL models for diagnosing ALNM [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref43">43</xref>]. The data were pooled from 40 validation cohorts across 28 studies, demonstrating an overall sensitivity of 0.80 (95% CI 0.76&#x2010;0.84) and a specificity of 0.85 (95% CI 0.80&#x2010;0.88). ALNM: axillary lymph node metastasis; DL: deep learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77593_fig04.png"/></fig><p>The internal validation analysis used 26 diagnostic 4-fold tables to evaluate the accuracy of a DL model in detecting ALNM. The observed prevalence of ALNM was 39%. The BME model yielded the following pooled estimates: a sensitivity of 0.82 (95% CI 0.78&#x2010;0.85), a specificity of 0.85 (95% CI 0.82&#x2010;0.88), an LR+ of 5.6 (95% CI 4.4&#x2010;7.0), and an LR&#x2212; of 0.21 (95% CI 0.18&#x2010;0.26). The DOR was 26 (95% CI 18&#x2010;38), with an AUC of 0.90 (95% CI 0.87&#x2010;0.92) (Figures S1 and S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot indicated no significant publication bias (<italic>P</italic>=.21) (Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.79 (Figure S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>For the external validation, 14 diagnostic 4-fold tables were assessed, with an ALNM prevalence of 43%. The BME model demonstrated a pooled sensitivity of 0.78 (95% CI 0.66&#x2010;0.86), a specificity of 0.82 (95% CI 0.72&#x2010;0.90), an LR+ of 4.4 (95% CI 2.9&#x2010;6.8), an LR&#x2212; of 0.27 (95% CI 0.19&#x2010;0.39), a DOR of 16 (95% CI 10&#x2010;26), and an AUC of 0.87 (95% CI 0.84&#x2010;0.90; Figures S5 and S6 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot indicated no significant publication bias (<italic>P</italic>=.16; Figure S7 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.75 (Figure S8 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Summary receiver operating characteristic curve (with prediction and confidence contours) from the bivariate meta-analysis evaluating the diagnostic accuracy of DL models for detecting ALNM in BC. The curve is based on 40 contingency tables derived from the validation cohorts of the included studies. The analysis yielded a summary AUC of 0.89 (95% CI 0.86&#x2010;0.92). ALNM: axillary lymph node metastasis; AUC: area under the summary receiver operating characteristic curve; BC: breast cancer; DL: deep learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77593_fig05.png"/></fig><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Assessment of potential publication bias using the Deeks funnel plot asymmetry test for the included studies on DL models in detecting ALNM in BC. The test indicated potential publication bias (<italic>P</italic>=.11). ALNM: axillary lymph node metastasis; BC: breast cancer; DL: deep learning; ESS: effective sample size.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77593_fig06.png"/></fig><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Fagan nomogram illustrating the 78% posttest probability of ALNM following a positive DL model result, given a 40% pretest probability. ALNM: axillary lymph node metastasis; DL: deep learning; LR: likelihood ratio.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77593_fig07.png"/></fig></sec><sec id="s3-3-5"><title>Conventional Ultrasound</title><p>Fourteen studies utilizing conventional ultrasound were included, which provided 20 distinct validation cohorts (due to multiple cohorts from several studies) for assessing DL models, with an ALNM prevalence of 38 %. The pooled results from the BME model were as follows: a sensitivity of 0.79 (95% CI 0.72&#x2010;0.84), a specificity of 0.86 (95% CI 0.79&#x2010;0.91), an LR+ of 5.5 (95% CI 3.8&#x2010;8.1), an LR&#x2212; of 0.25 (95% CI 0.19&#x2010;0.32), a DOR of 22 (95% CI 15&#x2010;33), and an AUC of 0.89 (95% CI 0.86&#x2010;0.91) (Figures S9 and S10 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot demonstrated no significant publication bias (<italic>P</italic>=.22) (Figure S11 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.79 (Figure S12 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>The internal validation involved 11 diagnostic 4-fold tables to evaluate the accuracy of a DL model in detecting ALNM. The observed ALNM prevalence was 33%. The BME model yielded the following pooled estimates: a sensitivity of 0.80 (95% CI 0.76&#x2010;0.83), a specificity of 0.85 (95% CI 0.79&#x2010;0.90), an LR+ of 5.5 (95% CI 3.6&#x2010;8.3), an LR&#x2212; of 0.24 (95% CI 0.19&#x2010;0.29), a DOR of 23 (95% CI 13&#x2010;41), and an AUC of 0.85 (95% CI 0.81&#x2010;0.88) (Figures S13 and S14 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot indicated no significant publication bias (<italic>P</italic>=.71) (Figure S15 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.78 (Figure S16 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>For the external validation, 9 diagnostic 4-fold tables were analyzed, with an ALNM prevalence of 47%. The BME model demonstrated a pooled sensitivity of 0.80 (95% CI 0.65&#x2010;0.90), a specificity of 0.85 (95% CI 0.71&#x2010;0.93), an LR+ of 5.4 (95% CI 2.9&#x2010;10.3), an LR&#x2212; of 0.23 (95% CI 0.13&#x2010;0.40), a DOR of 23 (95% CI 13&#x2010;44), and an AUC of 0.90 (95% CI 0.87&#x2010;0.92; Figures S17 and S18 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot indicated no significant publication bias (<italic>P</italic>=.16; Figure S19 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.78 (Figure S20 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-3-6"><title>Magnetic Resonance Imaging</title><p>Ten studies evaluated DL models based on MRI, with an ALNM prevalence of 42%. The pooled results from the BME model were as follows: a sensitivity of 0.78 (95% CI 0.71&#x2010;0.83), a specificity of 0.82 (95% CI 0.76&#x2010;0.87), an LR+ of 4.4 (95% CI 3.3&#x2010;5.9), an LR&#x2212; of 0.27 (95% CI 0.21&#x2010;0.35), a DOR of 16 (95% CI 11&#x2010;25), and an AUC of 0.87 (95% CI 0.84&#x2010;0.90; Figures S21 and S22 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot demonstrated no significant publication bias (<italic>P</italic>=.22; Figure S23 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.75 (Figure S24 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>The internal validation encompassed 11 diagnostic 4-fold tables to examine the accuracy of a DL model in detecting ALNM. The observed prevalence of ALNM was 44%. The BME model yielded the following pooled estimates: a sensitivity of 0.80 (95% CI 0.74&#x2010;0.86), a specificity of 0.84 (95% CI 0.79&#x2010;0.88), an LR+ of 4.9 (95% CI 3.7&#x2010;6.6), an LR&#x2212; of 0.23 (95% CI 0.17&#x2010;0.32), a DOR of 21 (95% CI 13&#x2010;35), and an AUC of 0.89 (95% CI 0.86&#x2010;0.92; Figures S25 and S26 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot indicated no significant publication bias (<italic>P</italic>=.16; Figure S27 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.77 (Figure S28 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>The external validation cohorts for MRI consisted of 4 studies encompassing 5 distinct cohorts, with an ALNM prevalence of 37%. The pooled results were as follows: a sensitivity of 0.73 (95% CI 0.57&#x2010;0.85), a specificity of 0.78 (95% CI 0.61&#x2010;0.90), an LR+ of 3.4 (95% CI 2.0&#x2010;5.8), an LR&#x2212; of 0.35 (95% CI 0.23&#x2010;0.52), a DOR of 10 (95% CI 6&#x2010;17), and an AUC of 0.82 (95% CI 0.78&#x2010;0.85; Figures S29 and S30 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot indicated no significant publication bias (<italic>P</italic>=.91; Figure S31 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.69 (Figure S32 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-3-7"><title>Computed Tomography</title><p>Regarding CT-based approaches, 4 studies developed DL models utilizing CT images. Of these, 3 studies were conducted in China and 1 in Korea. All 4 studies employed internal validation to generate their validation cohorts, with an ALNM prevalence of 43%. The pooled results were as follows: a sensitivity of 0.90 (95% CI 0.78&#x2010;0.96), a specificity of 0.88 (95% CI 0.84&#x2010;0.92), an LR+ of 7.8 (95% CI 5.3&#x2010;11.5), an LR&#x2212; of 0.11 (95% CI 0.05&#x2010;0.26), a DOR of 68 (95% CI 24&#x2010;196), and an AUC of 0.91 (95% CI 0.89&#x2010;0.94; Figures S33 and S34 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot indicated no significant publication bias (<italic>P</italic>=.97; Figure S35 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.84 (Figure S36 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec></sec><sec id="s3-4"><title>Chinese Population</title><p>Fifteen studies, comprising 34 diagnostic 4-fold tables, validated DL models constructed using Chinese populations, with an ALNM prevalence of 40%. The pooled results from the BME model were as follows: a sensitivity of 0.80 (95% CI 0.76&#x2010;0.84), a specificity of 0.85 (95% CI 0.80&#x2010;0.88), an LR+ of 5.3 (95% CI 4.1&#x2010;6.8), an LR&#x2212; of 0.23 (95% CI 0.19&#x2010;0.28), a DOR of 23 (95% CI 16&#x2010;31), and an AUC of 0.89 (95% CI 0.86&#x2010;0.92; Figures S37 and S38 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot revealed no significant publication bias (<italic>P</italic>=.08; Figure S39 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.78 (Figure S40 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-5"><title>Population of Other Countries</title><p>Six studies, comprising 5 diagnostic 4-fold tables, validated DL models constructed using non-Chinese populations, with an ALNM prevalence of 38%. The pooled results from the BME model were as follows: a sensitivity of 0.79 (95% CI 0.59&#x2010;0.90), a specificity of 0.84 (95% CI 0.78&#x2010;0.89), an LR+ of 5.0 (95% CI 3.5&#x2010;7.3), an LR&#x2212; of 0.25 (95% CI 0.12&#x2010;0.53), a DOR of 20 (95% CI 7&#x2010;53), and the AUC of 0.85 (95% CI 0.82&#x2010;0.88; Figures S41 and S42 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot demonstrated no significant publication bias (<italic>P</italic>=.67; Figure S43 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.77 (Figure S44 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-6"><title>Sensitivity Analysis</title><p>A sensitivity analysis was conducted by retaining only 1 validation cohort per study. For studies with multiple cohorts, the validation cohort with the highest Youden index was selected.</p><sec id="s3-6-1"><title>Analysis Based on Conventional Ultrasound Studies</title><p>Fourteen studies utilizing conventional ultrasound were included in the assessment of DL models, with an ALNM prevalence of 34%. The pooled results from the BME model were as follows: a sensitivity of 0.79 (95% CI 0.73&#x2010;0.84), a specificity of 0.86 (95% CI 0.78&#x2010;0.92), an LR+ of 5.8 (95% CI 3.7&#x2010;9.1), an LR&#x2212; of 0.24 (95% CI 0.19&#x2010;0.31), a DOR of 24 (95% CI 14&#x2010;41), and an AUC of 0.88 (95% CI 0.85&#x2010;0.91; Figures S45 and S46 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot demonstrated no significant publication bias (<italic>P</italic>=.24; Figure S47 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.79 (Figure S48 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-6-2"><title>Analysis Based on MRI Studies</title><p>Ten studies evaluated DL models based on MRI, with an ALNM prevalence of 44%. The pooled results from the BME model were as follows: a sensitivity of 0.82 (95% CI 0.75&#x2010;0.87), a specificity of 0.84 (95% CI 0.78&#x2010;0.88), an LR+ of 5.0 (95% CI 3.6&#x2010;6.8), an LR&#x2212; of 0.22 (95% CI 0.16&#x2010;0.30), a DOR of 22 (95% CI 13&#x2010;38), and an AUC of 0.90 (95% CI 0.87&#x2010;0.92; Figures S49 and S50 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot demonstrated no significant publication bias (<italic>P</italic>=.11; Figure S51 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.77 (Figure S52 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-6-3"><title>Human Clinical Experts</title><p>Seven studies compared the diagnostic performance of human clinical experts in assessing the ALNM status based on imaging. Among them, 4 studies included 7 clinicians who differentiated ALNM using ultrasound. The pooled sensitivity was 0.65 (95% CI 0.59&#x2010;0.71), specificity was 0.75 (95% CI 0.70&#x2010;0.79), LR+ was 2.6 (95% CI 2.1&#x2010;3.2), LR&#x2212; was 0.46 (95% CI 0.39&#x2010;0.56), DOR was 6 (95% CI 4&#x2010;8), and the AUC was 0.76 (95% CI 0.20&#x2010;0.97; Figures S53 and S54 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The Deeks funnel plot showed no significant publication bias (<italic>P</italic>=.80; Figure S55 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Assuming a prior probability of 0.4, a positive test result corresponded to a TP probability of 0.63 (Figure S56 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Three investigations assessed the performance of human clinicians in diagnosing ALNM via MRI. In the study by Jing Gao et al [<xref ref-type="bibr" rid="ref30">30</xref>], 3 radiologists independently evaluated MRI scans for ALNM in the validation set, achieving sensitivities between 64.7% and 75.0% and specificities ranging from 70.6% to 83.8%. With the assistance of the attention-based DL model RCNet, diagnostic performance was markedly improved, resulting in sensitivities of 76.5% to 83.3% and specificities of 80.9% to 89.7%. In the study by Y. Dai et al, 3 human experts evaluated the diagnostic ability of MRI for lymph node metastasis in BC (a sample size of 110). The sensitivity ranged from 0.681 to 0.767, and the specificity ranged from 0.746 to 0.841. Furthermore, the study by Zhou et al [<xref ref-type="bibr" rid="ref26">26</xref>] found that 3 clinical experts achieved sensitivities ranging from 0.660 to 0.745 and specificities from 0.731 to 0.836 in detecting ALNM. When combined with DL, sensitivity increased to 0.787&#x2010;0.829 and specificity increased to 0.806&#x2010;0.895. These findings underscore the clinical utility of AI as an auxiliary diagnostic tool.</p></sec></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Main Findings of This Study</title><p>This meta-analysis revealed that DL approaches for detecting ALNM in BC primarily relied on MRI, ultrasound, and CT. The sensitivity and specificity for ultrasound-based DL models were 0.79 and 0.86, respectively. Meanwhile, the sensitivity and specificity of MRI-based models were 0.78 and 0.82, respectively. Furthermore, CT-based models demonstrated a sensitivity of 0.90 and a specificity of 0.88. The sensitivity of CT was superior to that of MRI and ultrasound, while no substantial differences in specificity were observed among the 3 modalities. These robust performance metrics validated the potential of DL as a complementary tool to conventional imaging assessments.</p></sec><sec id="s4-2"><title>Comparison With Previous Reviews</title><p>Currently, ML has gained widespread attention in the diagnosis and treatment of BC. Previous systematic reviews have evaluated the accuracy of ML models based on various imaging modalities. For instance, a meta-analysis by Jing Zhang et al [<xref ref-type="bibr" rid="ref44">44</xref>], which included 13 studies involving 1618 patients, demonstrated that dynamic contrast-enhanced MRI radiomics had promising diagnostic performance in detecting ALNM and sentinel lymph node metastasis in patients with BC. However, only 2 of these studies employed DL methods, and the pooled sensitivity and specificity were 0.84 (95% CI 0.53&#x2010;0.96) and 0.65 (95% CI 0.31&#x2010;0.89), respectively. The limited number of studies constrained the interpretation of the results. Another meta-analysis by Chen et al [<xref ref-type="bibr" rid="ref45">45</xref>], which included 14 studies, focused on ML-based MRI for diagnosing ALNM in patients with BC, and the pooled sensitivity and specificity were 0.79 (95% CI 0.74&#x2010;0.84) and 0.77 (95% CI 0.73&#x2010;0.81), respectively. This study primarily summarized models, such as support vector machines, logistic regression, and linear discriminant analysis, without specifically addressing the diagnostic accuracy of DL techniques. Eldaly et al [<xref ref-type="bibr" rid="ref46">46</xref>] systematically reviewed radiomics approaches for detecting ALNM. Their results revealed that the AUC of the included studies varied from 0.72 to 0.93. However, they did not provide a detailed summary of diagnostic performance, thus limiting the assessment of its true accuracy. Liu et al [<xref ref-type="bibr" rid="ref47">47</xref>] investigated the feasibility of AI algorithms based on CT and MRI for detecting ALNM in BC. They found that MRI-based methods demonstrated a sensitivity of 0.85 (95% CI 0.79&#x2010;0.90) and specificity of 0.81 (95% CI 0.66&#x2010;0.83), while CT-based methods showed a sensitivity of 0.88 (95% CI: 0.79&#x2010;0.94) and specificity of 0.80 (95%CI: 0.69&#x2010;0.88). A radiomics study [<xref ref-type="bibr" rid="ref48">48</xref>] included MRI, ultrasound, CT, and X-ray mammography. A meta-analysis of 30 studies involving a total of 5611 patients was conducted. The pooled sensitivity and specificity of radiomics for detecting ALNM were 0.86 (95% CI 0.82&#x2010;0.88) and 0.79 (95% CI 0.73&#x2010;0.84), respectively, demonstrating strong overall diagnostic accuracy. Gong et al [<xref ref-type="bibr" rid="ref48">48</xref>] comprehensively evaluated the performance of radiomics in detecting ALNM. Their results demonstrated an overall diagnostic accuracy of 23 (95% CI 16&#x2010;33) and a sensitivity of 0.86 (95% CI 0.82&#x2010;0.88). Radiomics serves as a promising noninvasive approach that can contribute to offering new quantitative modalities for disease diagnosis. However, their study did not strictly differentiate between types of ML, and different ML methods demonstrated varying performance in detecting positive events. Furthermore, there was no strict distinction between datasets in their study, with notable variations observed between the results in the training and validation sets.</p><p>With the advancement of AI, there has been a shift from traditional ML to DL. DL can analyze complex and diverse data, enabling personalized diagnosis and treatment that aligns with the current trend of precision medicine. Previous meta-analyses have lacked comprehensive evidence on DL models for detecting ALNM in patients with BC across various imaging modalities.</p><p>The present meta-analysis only included DL-based studies to minimize the variability of outcomes caused by different modalities. DL offers significant advantages over traditional ML with more advanced techniques for image processing, contributing to the development of diagnostic models for diseases [<xref ref-type="bibr" rid="ref37">37</xref>]. Our findings suggested that image-based DL for detecting ALNM in BC demonstrated favorable diagnostic performance. MRI, ultrasound, and CT are commonly used techniques for detecting ALNM in BC. However, MRI is not necessary or routinely used in BC diagnosis due to its higher cost. Our findings reveal that CT-based models achieved higher sensitivity, specificity, and AUC than models based on ultrasound and MRI. However, since only 4 studies on CT were included, the results should be validated using larger datasets. Therefore, future research should develop more CT-based diagnostic models using AI to expand its role in diagnosing BC.</p><p>The trade-off between sensitivity and specificity for ultrasound and MRI highlights their complementary roles in clinical practice. The high sensitivity of ultrasound models effectively reduces false negatives by excluding metastasis, whereas the high specificity of MRI models improves confirmation of positive cases by minimizing false positives. These findings support the development of an integrated multimodal DL strategy, with ultrasound as an initial screening tool and MRI for confirming difficult cases. However, real-world validation is required.</p><p>Before developing DL-based intelligent diagnostic tools, several challenges require attention. First, the impact of different imaging protocols and preprocessing methods on DL performance must be thoroughly examined. Second, DL models typically require large image datasets. Therefore, future studies should incorporate more extensive imaging data to ensure the robustness of the DL model. Third, the impact of population heterogeneity on model performance should be carefully considered. Future research should include multicenter, multiethnic cohorts when developing DL models. Fourth, external validation is essential to enhance the credibility and generalizability of these DL models. Nevertheless, most included studies relied solely on internal validation, making it difficult to conduct external validation across multiple centers. Among the 28 studies, the majority employed single-center internal validation. Therefore, future research should incorporate more multicenter studies to confirm the real-world applicability of these models.</p></sec><sec id="s4-3"><title>Study Limitations</title><p>This is the first study to systematically investigate the feasibility of DL for detecting ALNM in BC. However, several limitations should be noted. First, despite a comprehensive literature search, the number of included studies was limited, restricting in-depth analysis and the generalizability of the findings. Second, most included studies relied on random sampling validation and lacked diverse external validation, undermining the overall reliability and generalizability of the results. Third, only a few studies directly compared DL models with clinical experts, and the available data were too limited to support a robust effect size analysis. As a result, it remains uncertain whether DL surpasses clinical experts in diagnostic performance. Fourth, many studies did not provide detailed descriptions of critical aspects, such as image acquisition protocols, segmentation techniques, network architectures and inputs, and reference standards (including biopsy methods and reference intervals). Fifth, this meta-analysis relied solely on data reported in the published articles and their supplementary materials. We did not contact the corresponding authors regarding missing or incomplete data. This may have resulted in the exclusion of some potentially eligible studies, which could introduce bias if the missing data differ systematically from the included data. Sixth, most included studies were based on retrospective evidence. Therefore, future research should focus on standardizing image processing methods and conducting prospective, multicenter external validations to develop DL models with enhanced robustness and broader applicability. Finally, this meta-analysis incorporated validation cohorts from the included studies. For studies that provided multiple validation cohorts, each cohort was included as an independent data point in the analysis. This approach may violate the inherent assumption of independence in the standard BME model. While we conducted a sensitivity analysis by extracting only a single validation cohort per original study, this alternative method may also introduce a certain degree of publication bias. Consequently, although DL models show promise for detecting ALNM, the current findings should be interpreted with caution. Future prospective studies with preregistered protocols are needed to verify these results and minimize publication bias.</p></sec><sec id="s4-4"><title>Conclusions</title><p>This study revealed that DL models based on medical imaging showed promising accuracy in detecting ALNM in patients with BC. These findings may provide an evidence-based foundation for developing intelligent diagnostic tools. However, the findings were primarily based on models developed from single-center, retrospective datasets. Therefore, future studies should adopt a series of strategies, including but not limited to expanding the sample size, integrating multimodal imaging for joint modeling, and conducting prospective validation, to further enhance the performance of DL models while ensuring their applicability and clinical utility.</p></sec></sec></body><back><ack><p>We confirm that no generative artificial intelligence tools were used at any stage in the preparation of this paper. All content, including references and citations, is the original work of the authors, who take full responsibility for its accuracy and integrity.</p></ack><notes><sec><title>Funding</title><p>This work was supported by the National Natural Science Foundation of China (grant number 82072909) and by the Hospital-Level Research Project of Subei People's Hospital of Jiangsu Province (grant number SBQN25007).</p></sec><sec><title>Data Availability</title><p>The data that support the findings of this study are available from the corresponding author upon reasonable request.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">ALNM</term><def><p>axillary lymph node metastasis</p></def></def-item><def-item><term id="abb3">AUC</term><def><p>area under the summary receiver operating characteristic curve</p></def></def-item><def-item><term id="abb4">BC</term><def><p>breast cancer</p></def></def-item><def-item><term id="abb5">BME</term><def><p>bivariate mixed effects</p></def></def-item><def-item><term id="abb6">CT</term><def><p>computed tomography</p></def></def-item><def-item><term id="abb7">DL</term><def><p>deep learning</p></def></def-item><def-item><term id="abb8">DOR</term><def><p>diagnostic odds ratio</p></def></def-item><def-item><term id="abb9">LR+</term><def><p>positive likelihood ratio</p></def></def-item><def-item><term id="abb10">LR&#x2212;</term><def><p>negative likelihood ratio</p></def></def-item><def-item><term id="abb11">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb12">MRI</term><def><p>magnetic resonance imaging</p></def></def-item><def-item><term id="abb13">PRISMA</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p></def></def-item><def-item><term id="abb14">PROSPERO </term><def><p>Prospective Register of Systematic Reviews</p></def></def-item><def-item><term id="abb15">RoB</term><def><p>risk of bias</p></def></def-item><def-item><term id="abb16">TP</term><def><p>true positive</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Harper</surname><given-names>A</given-names> </name><name name-style="western"><surname>McCormack</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Global patterns and trends in breast cancer incidence and mortality across 185 countries</article-title><source>Nat Med</source><year>2025</year><month>04</month><volume>31</volume><issue>4</issue><fpage>1154</fpage><lpage>1162</lpage><pub-id pub-id-type="doi">10.1038/s41591-025-03502-3</pub-id><pub-id pub-id-type="medline">39994475</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Siegel</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Giaquinto</surname><given-names>AN</given-names> </name><name name-style="western"><surname>Jemal</surname><given-names>A</given-names> </name></person-group><article-title>Cancer statistics, 2024</article-title><source>CA Cancer J Clin</source><year>2024</year><volume>74</volume><issue>1</issue><fpage>12</fpage><lpage>49</lpage><pub-id pub-id-type="doi">10.3322/caac.21820</pub-id><pub-id pub-id-type="medline">38230766</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sung</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ferlay</surname><given-names>J</given-names> </name><name name-style="western"><surname>Siegel</surname><given-names>RL</given-names> </name><etal/></person-group><article-title>Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title><source>CA Cancer J Clin</source><year>2021</year><month>05</month><volume>71</volume><issue>3</issue><fpage>209</fpage><lpage>249</lpage><pub-id pub-id-type="doi">10.3322/caac.21660</pub-id><pub-id pub-id-type="medline">33538338</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schmid</surname><given-names>P</given-names> </name><name name-style="western"><surname>Cortes</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dent</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Overall survival with pembrolizumab in early-stage triple-negative breast cancer</article-title><source>N Engl J Med</source><year>2024</year><month>11</month><day>28</day><volume>391</volume><issue>21</issue><fpage>1981</fpage><lpage>1991</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa2409932</pub-id><pub-id pub-id-type="medline">39282906</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Strnad</surname><given-names>V</given-names> </name><name name-style="western"><surname>Polg&#x00E1;r</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ott</surname><given-names>OJ</given-names> </name><etal/></person-group><article-title>Accelerated partial breast irradiation using sole interstitial multicatheter brachytherapy compared with whole-breast irradiation with boost for early breast cancer: 10-year results of a GEC-ESTRO randomised, phase 3, non-inferiority trial</article-title><source>Lancet Oncol</source><year>2023</year><month>03</month><volume>24</volume><issue>3</issue><fpage>262</fpage><lpage>272</lpage><pub-id pub-id-type="doi">10.1016/S1470-2045(23)00018-9</pub-id><pub-id pub-id-type="medline">36738756</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>XC</given-names> </name><name name-style="western"><surname>Jiao</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Qiao</surname><given-names>JH</given-names> </name><etal/></person-group><article-title>De-escalated neoadjuvant weekly nab-paclitaxel with trastuzumab and pertuzumab versus docetaxel, carboplatin, trastuzumab, and pertuzumab in patients with HER2-positive early breast cancer (HELEN-006): a multicentre, randomised, phase 3 trial</article-title><source>Lancet Oncol</source><year>2025</year><month>01</month><volume>26</volume><issue>1</issue><fpage>27</fpage><lpage>36</lpage><pub-id pub-id-type="doi">10.1016/S1470-2045(24)00581-3</pub-id><pub-id pub-id-type="medline">39612919</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chang</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Leung</surname><given-names>JWT</given-names> </name><name name-style="western"><surname>Moy</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ha</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Moon</surname><given-names>WK</given-names> </name></person-group><article-title>Axillary nodal evaluation in breast cancer: state of the art</article-title><source>Radiology</source><year>2020</year><month>06</month><volume>295</volume><issue>3</issue><fpage>500</fpage><lpage>515</lpage><pub-id pub-id-type="doi">10.1148/radiol.2020192534</pub-id><pub-id pub-id-type="medline">32315268</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Greener</surname><given-names>JG</given-names> </name><name name-style="western"><surname>Kandathil</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Moffat</surname><given-names>L</given-names> </name><name name-style="western"><surname>Jones</surname><given-names>DT</given-names> </name></person-group><article-title>A guide to machine learning for biologists</article-title><source>Nat Rev Mol Cell Biol</source><year>2022</year><month>01</month><volume>23</volume><issue>1</issue><fpage>40</fpage><lpage>55</lpage><pub-id pub-id-type="doi">10.1038/s41580-021-00407-0</pub-id><pub-id pub-id-type="medline">34518686</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elemento</surname><given-names>O</given-names> </name><name name-style="western"><surname>Leslie</surname><given-names>C</given-names> </name><name name-style="western"><surname>Lundin</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tourassi</surname><given-names>G</given-names> </name></person-group><article-title>Artificial intelligence in cancer research, diagnosis and therapy</article-title><source>Nat Rev Cancer</source><year>2021</year><month>12</month><volume>21</volume><issue>12</issue><fpage>747</fpage><lpage>752</lpage><pub-id pub-id-type="doi">10.1038/s41568-021-00399-1</pub-id><pub-id pub-id-type="medline">34535775</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Swanson</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>E</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>A</given-names> </name><name name-style="western"><surname>Alizadeh</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>J</given-names> </name></person-group><article-title>From patterns to patients: advances in clinical machine learning for cancer diagnosis, prognosis, and treatment</article-title><source>Cell</source><year>2023</year><month>04</month><day>13</day><volume>186</volume><issue>8</issue><fpage>1772</fpage><lpage>1791</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2023.01.035</pub-id><pub-id pub-id-type="medline">36905928</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhan</surname><given-names>T</given-names> </name></person-group><article-title>DL 101: basic introduction to deep learning with its application in biomedical related fields</article-title><source>Stat Med</source><year>2022</year><month>11</month><day>20</day><volume>41</volume><issue>26</issue><fpage>5365</fpage><lpage>5378</lpage><pub-id pub-id-type="doi">10.1002/sim.9564</pub-id><pub-id pub-id-type="medline">36041380</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Biology-guided deep learning predicts prognosis and cancer immunotherapy response</article-title><source>Nat Commun</source><year>2023</year><month>08</month><day>23</day><volume>14</volume><issue>1</issue><fpage>5135</fpage><pub-id pub-id-type="doi">10.1038/s41467-023-40890-x</pub-id><pub-id pub-id-type="medline">37612313</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhong</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>C</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>T</given-names> </name><etal/></person-group><article-title>PET/CT based cross-modal deep learning signature to predict occult nodal metastasis in lung cancer</article-title><source>Nat Commun</source><year>2023</year><month>11</month><day>18</day><volume>14</volume><issue>1</issue><fpage>7513</fpage><pub-id pub-id-type="doi">10.1038/s41467-023-42811-4</pub-id><pub-id pub-id-type="medline">37980411</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Kwon</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Hyeon</surname><given-names>J</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>BJ</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>BJ</given-names> </name></person-group><article-title>Deep learning prediction of axillary lymph node metastasis in breast cancer patients using clinical implication-applied preprocessed ct images</article-title><source>Curr Oncol</source><year>2024</year><month>04</month><day>18</day><volume>31</volume><issue>4</issue><fpage>2278</fpage><lpage>2288</lpage><pub-id pub-id-type="doi">10.3390/curroncol31040169</pub-id><pub-id pub-id-type="medline">38668072</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Dong</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Deep learning radiomics of preoperative breast MRI for prediction of axillary lymph node metastasis in breast cancer</article-title><source>J Digit Imaging</source><year>2023</year><month>08</month><volume>36</volume><issue>4</issue><fpage>1323</fpage><lpage>1331</lpage><pub-id pub-id-type="doi">10.1007/s10278-023-00818-9</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>WB</given-names> </name><name name-style="western"><surname>Du</surname><given-names>ZC</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>YJ</given-names> </name><etal/></person-group><article-title>Prediction of axillary lymph node metastasis in early breast cancer patients with ultrasonic videos based deep learning</article-title><source>Front Oncol</source><year>2023</year><volume>13</volume><fpage>1219838</fpage><pub-id pub-id-type="doi">10.3389/fonc.2023.1219838</pub-id><pub-id pub-id-type="medline">37719009</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Whiting</surname><given-names>PF</given-names> </name><name name-style="western"><surname>Rutjes</surname><given-names>AWS</given-names> </name><name name-style="western"><surname>Westwood</surname><given-names>ME</given-names> </name><etal/></person-group><article-title>QUADAS-2: a revised tool for the quality assessment of diagnostic accuracy studies</article-title><source>Ann Intern Med</source><year>2011</year><month>10</month><day>18</day><volume>155</volume><issue>8</issue><fpage>529</fpage><lpage>536</lpage><pub-id pub-id-type="doi">10.7326/0003-4819-155-8-201110180-00009</pub-id><pub-id pub-id-type="medline">22007046</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gong</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Computer-assisted diagnosis for axillary lymph node metastasis of early breast cancer based on transformer with dual-modal adaptive mid-term fusion using ultrasound elastography</article-title><source>Comput Med Imaging Graph</source><year>2025</year><month>01</month><volume>119</volume><fpage>102472</fpage><pub-id pub-id-type="doi">10.1016/j.compmedimag.2024.102472</pub-id><pub-id pub-id-type="medline">39612691</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Agyekum</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Kong</surname><given-names>W</given-names> </name><name name-style="western"><surname>Agyekum</surname><given-names>DN</given-names> </name><etal/></person-group><article-title>Ultrasound derived deep learning features for predicting axillary lymph node metastasis in breast cancer using graph convolutional networks in a multicenter study</article-title><source>Sci Rep</source><year>2025</year><month>07</month><day>30</day><volume>15</volume><issue>1</issue><fpage>27796</fpage><pub-id pub-id-type="doi">10.1038/s41598-025-13086-0</pub-id><pub-id pub-id-type="medline">40738938</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Ding</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Applying a multi-task and multi-instance framework to predict axillary lymph node metastases in breast cancer</article-title><source>NPJ Precis Oncol</source><year>2025</year><month>06</month><day>18</day><volume>9</volume><issue>1</issue><fpage>195</fpage><pub-id pub-id-type="doi">10.1038/s41698-025-00971-0</pub-id><pub-id pub-id-type="medline">40533499</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gu</surname><given-names>C</given-names> </name><name name-style="western"><surname>He</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Preoperative prediction of axillary lymph node metastasis in breast invasive ductal carcinoma patients using a deep learning model based on dynamic contrast-enhanced magnetic resonance imaging: a multicenter study</article-title><source>Gland Surg</source><year>2025</year><month>11</month><day>30</day><volume>14</volume><issue>11</issue><fpage>2288</fpage><lpage>2301</lpage><pub-id pub-id-type="doi">10.21037/gs-2025-365</pub-id><pub-id pub-id-type="medline">41377877</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dai</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Predicting axillary lymph node metastasis in breast cancer patients using CNN-GCN on DCE-MRI: a multicenter study</article-title><source>BMC Med Imaging</source><year>2025</year><month>11</month><day>20</day><volume>25</volume><issue>1</issue><fpage>481</fpage><pub-id pub-id-type="doi">10.1186/s12880-025-01988-4</pub-id><pub-id pub-id-type="medline">41266995</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sun</surname><given-names>J</given-names> </name><name name-style="western"><surname>Xi</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>M</given-names> </name><etal/></person-group><article-title>A deep learning model based on chest CT to predict benign and malignant breast masses and axillary lymph node metastasis</article-title><source>Biomol Biomed</source><year>2025</year><month>03</month><day>17</day><volume>26</volume><issue>1</issue><fpage>91</fpage><lpage>99</lpage><pub-id pub-id-type="doi">10.17305/bb.2025.12010</pub-id><pub-id pub-id-type="medline">40100034</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Nie</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>Artificial intelligence assisted ultrasound for the non-invasive prediction of axillary lymph node metastasis in breast cancer</article-title><source>BMC Cancer</source><year>2024</year><month>07</month><day>29</day><volume>24</volume><issue>1</issue><fpage>910</fpage><pub-id pub-id-type="doi">10.1186/s12885-024-12619-6</pub-id><pub-id pub-id-type="medline">39075447</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Polat</surname><given-names>DS</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Karbasi</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Machine learning prediction of lymph node metastasis in breast cancer: performance of a multi-institutional MRI-based 4D convolutional neural network</article-title><source>Radiol Imaging Cancer</source><year>2024</year><month>05</month><volume>6</volume><issue>3</issue><fpage>e230107</fpage><pub-id pub-id-type="doi">10.1148/rycan.230107</pub-id><pub-id pub-id-type="medline">38607282</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>H</given-names> </name><name name-style="western"><surname>Hua</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Multitask deep learning-based whole-process system for automatic diagnosis of breast lesions and axillary lymph node metastasis discrimination from dynamic contrast-enhanced-MRI: a multicenter study</article-title><source>J Magn Reson Imaging</source><year>2024</year><month>05</month><volume>59</volume><issue>5</issue><fpage>1710</fpage><lpage>1722</lpage><pub-id pub-id-type="doi">10.1002/jmri.28913</pub-id><pub-id pub-id-type="medline">37497811</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>L</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Deep learning radiomics based prediction of axillary lymph node metastasis in breast cancer</article-title><source>NPJ Breast Cancer</source><year>2024</year><month>03</month><day>12</day><volume>10</volume><issue>1</issue><fpage>22</fpage><pub-id pub-id-type="doi">10.1038/s41523-024-00628-4</pub-id><pub-id pub-id-type="medline">38472210</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guo</surname><given-names>YJ</given-names> </name><name name-style="western"><surname>Yin</surname><given-names>R</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>MRI-based kinetic heterogeneity evaluation in the accurate access of axillary lymph node status in breast cancer using a hybrid CNN-RNN model</article-title><source>J Magn Reson Imaging</source><year>2024</year><month>10</month><volume>60</volume><issue>4</issue><fpage>1352</fpage><lpage>1364</lpage><pub-id pub-id-type="doi">10.1002/jmri.29225</pub-id><pub-id pub-id-type="medline">38205712</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wei</surname><given-names>W</given-names> </name><name name-style="western"><surname>Ma</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Feng</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Deep learning radiomics for prediction of axillary lymph node metastasis in patients with clinical stage T1-2 breast cancer</article-title><source>Quant Imaging Med Surg</source><year>2023</year><month>08</month><day>1</day><volume>13</volume><issue>8</issue><fpage>4995</fpage><lpage>5011</lpage><pub-id pub-id-type="doi">10.21037/qims-22-1257</pub-id><pub-id pub-id-type="medline">37581073</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gao</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhong</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Attention-based deep learning for the preoperative differentiation of axillary lymph node metastasis in breast cancer on DCE-MRI</article-title><source>J Magn Reson Imaging</source><year>2023</year><month>06</month><volume>57</volume><issue>6</issue><fpage>1842</fpage><lpage>1853</lpage><pub-id pub-id-type="doi">10.1002/jmri.28464</pub-id><pub-id pub-id-type="medline">36219519</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Predicting of axillary lymph node metastasis in invasive breast cancer using multiparametric MRI dataset based on CNN model</article-title><source>Front Oncol</source><year>2022</year><volume>12</volume><fpage>1069733</fpage><pub-id pub-id-type="doi">10.3389/fonc.2022.1069733</pub-id><pub-id pub-id-type="medline">36561533</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Shi</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yin</surname><given-names>P</given-names> </name><etal/></person-group><article-title>A machine learning model based on ultrasound image features to assess the risk of sentinel lymph node metastasis in breast cancer patients:applications of scikit-learn and SHAP</article-title><source>Front Oncol</source><year>2022</year><volume>12</volume><fpage>944569</fpage><pub-id pub-id-type="doi">10.3389/fonc.2022.944569</pub-id><pub-id pub-id-type="medline">35957890</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>H</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Preoperative prediction of axillary lymph node metastasis in breast cancer using CNN based on multiparametric MRI</article-title><source>J Magn Reson Imaging</source><year>2022</year><month>09</month><volume>56</volume><issue>3</issue><fpage>700</fpage><lpage>709</lpage><pub-id pub-id-type="doi">10.1002/jmri.28082</pub-id><pub-id pub-id-type="medline">35108415</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sun</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mutasa</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>MZ</given-names> </name><etal/></person-group><article-title>Deep learning prediction of axillary lymph node status using ultrasound images</article-title><source>Comput Biol Med</source><year>2022</year><month>04</month><volume>143</volume><fpage>105250</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2022.105250</pub-id><pub-id pub-id-type="medline">35114444</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Santucci</surname><given-names>D</given-names> </name><name name-style="western"><surname>Faiella</surname><given-names>E</given-names> </name><name name-style="western"><surname>Gravina</surname><given-names>M</given-names> </name><etal/></person-group><article-title>CNN-based approaches with different tumor bounding options for lymph node status prediction in breast DCE-MRI</article-title><source>Cancers (Basel)</source><year>2022</year><month>09</month><day>21</day><volume>14</volume><issue>19</issue><fpage>4574</fpage><pub-id pub-id-type="doi">10.3390/cancers14194574</pub-id><pub-id pub-id-type="medline">36230497</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>C</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Jia</surname><given-names>L</given-names> </name><etal/></person-group><article-title>A convolutional neural network based on ultrasound images of primary breast masses: prediction of lymph-node metastasis in collaboration with classification of benign and malignant tumors</article-title><source>Front Physiol</source><year>2022</year><volume>13</volume><fpage>882648</fpage><pub-id pub-id-type="doi">10.3389/fphys.2022.882648</pub-id><pub-id pub-id-type="medline">35721528</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cattell</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ying</surname><given-names>J</given-names> </name><name name-style="western"><surname>Lei</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Preoperative prediction of lymph node metastasis using deep learning-based features</article-title><source>Vis Comput Ind Biomed Art</source><year>2022</year><month>03</month><day>7</day><volume>5</volume><issue>1</issue><fpage>8</fpage><pub-id pub-id-type="doi">10.1186/s42492-022-00104-5</pub-id><pub-id pub-id-type="medline">35254557</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zeng</surname><given-names>R</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Decoupling convolution network for characterizing the metastatic lymph nodes of breast cancer patients</article-title><source>Med Phys</source><year>2021</year><month>07</month><volume>48</volume><issue>7</issue><fpage>3679</fpage><lpage>3690</lpage><pub-id pub-id-type="doi">10.1002/mp.14876</pub-id><pub-id pub-id-type="medline">33825207</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Ni</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Axillary lymph node metastasis prediction by contrast-enhanced computed tomography images for breast cancer patients based on deep learning</article-title><source>Comput Biol Med</source><year>2021</year><month>09</month><volume>136</volume><fpage>104715</fpage><pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.104715</pub-id><pub-id pub-id-type="medline">34388460</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>LQ</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>XL</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>SY</given-names> </name><etal/></person-group><article-title>Lymph node metastasis prediction from primary breast cancer US images using deep learning</article-title><source>Radiology</source><year>2020</year><month>01</month><volume>294</volume><issue>1</issue><fpage>19</fpage><lpage>28</lpage><pub-id pub-id-type="doi">10.1148/radiol.2019190372</pub-id><pub-id pub-id-type="medline">31746687</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zheng</surname><given-names>X</given-names> </name><name name-style="western"><surname>Yao</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Deep learning radiomics can predict axillary lymph node status in early-stage breast cancer</article-title><source>Nat Commun</source><year>2020</year><month>03</month><day>6</day><volume>11</volume><issue>1</issue><fpage>1236</fpage><pub-id pub-id-type="doi">10.1038/s41467-020-15027-z</pub-id><pub-id pub-id-type="medline">32144248</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sun</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>X</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Deep learning vs. radiomics for predicting axillary lymph node metastasis of breast cancer using ultrasound images: don&#x2019;t forget the peritumoral region</article-title><source>Front Oncol</source><year>2020</year><volume>10</volume><issue>53</issue><fpage>53</fpage><pub-id pub-id-type="doi">10.3389/fonc.2020.00053</pub-id><pub-id pub-id-type="medline">32083007</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Guo</surname><given-names>X</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Deep learning radiomics of ultrasonography: identifying the risk of axillary non-sentinel lymph node involvement in primary breast cancer</article-title><source>EBioMedicine</source><year>2020</year><month>10</month><volume>60</volume><fpage>103018</fpage><pub-id pub-id-type="doi">10.1016/j.ebiom.2020.103018</pub-id><pub-id pub-id-type="medline">32980697</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhe</surname><given-names>X</given-names> </name><etal/></person-group><article-title>The diagnostic performance of machine learning-based radiomics of DCE-MRI in predicting axillary lymph node metastasis in breast cancer: a meta-analysis</article-title><source>Front Oncol</source><year>2022</year><volume>12</volume><fpage>799209</fpage><pub-id pub-id-type="doi">10.3389/fonc.2022.799209</pub-id><pub-id pub-id-type="medline">35186739</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Qin</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>X</given-names> </name></person-group><article-title>A meta-analysis of the diagnostic performance of machine learning-based MRI in the prediction of axillary lymph node metastasis in breast cancer patients</article-title><source>Insights Imaging</source><year>2021</year><month>11</month><day>3</day><volume>12</volume><issue>1</issue><fpage>156</fpage><pub-id pub-id-type="doi">10.1186/s13244-021-01034-1</pub-id><pub-id pub-id-type="medline">34731343</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eldaly</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Avila</surname><given-names>FR</given-names> </name><name name-style="western"><surname>Torres-Guzman</surname><given-names>RA</given-names> </name><etal/></person-group><article-title>Radiomics and artificial intelligence in predicting axillary lymph node metastasis in breast cancer: a systematic review</article-title><source>Curr Med Imaging</source><year>2023</year><volume>19</volume><issue>6</issue><fpage>564</fpage><lpage>578</lpage><pub-id pub-id-type="doi">10.2174/1573405618666220822093226</pub-id><pub-id pub-id-type="medline">35996255</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Application of CT and MRI images based on an artificial intelligence algorithm for predicting lymph node metastasis in breast cancer patients: a meta-analysis</article-title><source>BMC Cancer</source><year>2023</year><month>11</month><day>22</day><volume>23</volume><issue>1</issue><fpage>1134</fpage><pub-id pub-id-type="doi">10.1186/s12885-023-11638-z</pub-id><pub-id pub-id-type="medline">37993845</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gong</surname><given-names>X</given-names> </name><name name-style="western"><surname>Guo</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>X</given-names> </name><name name-style="western"><surname>Xing</surname><given-names>D</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>M</given-names> </name></person-group><article-title>Diagnostic performance of radiomics in predicting axillary lymph node metastasis in breast cancer: a systematic review and meta-analysis</article-title><source>Front Oncol</source><year>2022</year><volume>12</volume><fpage>1046005</fpage><pub-id pub-id-type="doi">10.3389/fonc.2022.1046005</pub-id><pub-id pub-id-type="medline">36518318</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>The complete electronic search strategies and all supplementary figures and tables for the systematic review. It includes the detailed search syntax for the PubMed, Web of Science, Embase, and Cochrane Library databases (Table S1), as well as 56 supplementary figures (Figures S1-S56) that present the supplementary data, analyses, and visualizations supporting the main findings of the review, such as sensitivity analyses, specificity analyses, the summary receiver operating characteristic curve, Deeks funnel plot, and Fagan nomogram.</p><media xlink:href="jmir_v28i1e77593_app1.doc" xlink:title="DOC File, 5206 KB"/></supplementary-material><supplementary-material id="app2"><label>Checklist 1</label><p>PRISMA checklist.</p><media xlink:href="jmir_v28i1e77593_app2.pdf" xlink:title="PDF File, 86 KB"/></supplementary-material></app-group></back></article>