<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="systematic-review" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2025.1634694</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Oncology</subject>
<subj-group>
<subject>Systematic Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Artificial intelligence versus radiologists in predicting lung cancer treatment response: a systematic review and meta-analysis</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Rodriguez</surname>
<given-names>Nehemias Guevara</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1836266/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mercado</surname>
<given-names>Noemy Coreas</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Panjiyar</surname>
<given-names>Kumar</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kunwor</surname>
<given-names>Ranju</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3084333/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Medicine, Division of Hematology, Oncology and Bone Marrow Transplant, Saint Louis University School of Medicine</institution>, <addr-line>St. Louis, MO</addr-line>,&#xa0;<country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Obstetrics and Gynecology, Division of Gynecologic Oncology, Social Security System of El Salvador, Universidad de El Salvador</institution>, <addr-line>San Salvador</addr-line>, <country>El Salvador</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Medicine, Johns Hopkins University School of Medicine</institution>, <addr-line>Baltimore, MD</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1399207/overview">Morgan Michalet</ext-link>, Institut du Cancer de Montpellier (ICM), France</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3067649/overview">Esteban Zavaleta</ext-link>, Hospital Clinica Biblica, Costa Rica</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3087307/overview">Adelina Mavrea</ext-link>, Victor Babes University of Medicine and Pharmacy, Romania</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Nehemias Guevara Rodriguez, <email xlink:href="mailto:nehemias.guevararodriguez@ssmhealth.com">nehemias.guevararodriguez@ssmhealth.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>10</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>15</volume>
<elocation-id>1634694</elocation-id>
<history>
<date date-type="received">
<day>25</day>
<month>05</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>12</day>
<month>09</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Rodriguez, Mercado, Panjiyar and Kunwor.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Rodriguez, Mercado, Panjiyar and Kunwor</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Artificial intelligence (AI) has emerged as a promising adjunct to radiologist interpretation in oncology imaging. This systematic review and meta-analysis compares the diagnostic performance of AI systems versus radiologists in predicting lung cancer treatment response, focusing solely on treatment response rather than diagnosis.</p>
</sec>
<sec>
<title>Methods</title>
<p>We systematically searched PubMed, Embase, Scopus, Web of Science, and the Cochrane Library from inception to March 31, 2025; Google Scholar and CINAHL were used for citation chasing/grey literature. The review protocol was prospectively registered in PROSPERO (CRD420251048243). Studies directly comparing AI-based imaging analysis with radiologist interpretation for predicting treatment response in lung cancer were included. Two reviewers extracted data independently (Cohen&#x2019;s &#x3ba; = 0.87). We pooled sensitivity, specificity, accuracy, and risk differences using DerSimonian&#x2013;Laird random-effects models. Heterogeneity (I&#xb2;), threshold effects (Spearman correlation), and publication bias (funnel plots, Egger&#x2019;s test) were assessed. Subgroups were prespecified by imaging modality and therapy class.</p>
</sec>
<sec>
<title>Results</title>
<p>Eleven retrospective studies (n = 6,615) were included. Pooled sensitivity for AI was 0.9 (95% CI: 0.8&#x2013;0.9; I&#xb2; = 58%), specificity 0.8 (95% CI: 0.8&#x2013;0.9; I&#xb2; = 52%), and accuracy 0.9 (95% CI: 0.8&#x2013;0.9; pooled OR = 1.4, 95% CI: 1.2&#x2013;1.7). Risk difference favored AI by 0.06 for sensitivity and 0.04 for specificity. AI&#x2019;s advantage was most apparent in CT and PET/CT, with smaller/non-significant gains in MRI. Egger&#x2019;s test suggested no significant publication bias (p = 0.21).</p>
</sec>
<sec>
<title>Conclusion</title>
<p>AI demonstrates modest but statistically significant superiority over radiologists in predicting lung cancer treatment response, particularly in CT and PET/CT imaging. However, generalizability is limited by retrospective study dominance, incomplete demographic reporting, lack of regulatory clearance, and minimal cost-effectiveness evaluation. Prospective, multicenter trials incorporating explainable AI (e.g., SHAP, Grad-CAM), equity assessments, and formal economic analyses are needed.</p>
</sec>
<sec>
<title>Systematic Review Registration</title>
<p>
<uri xlink:href="https://www.crd.york.ac.uk/prospero/">https://www.crd.york.ac.uk/prospero/</uri>, identifier CRD420251048243.</p>
</sec>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>lung cancer</kwd>
<kwd>treatment response</kwd>
<kwd>radiomics</kwd>
<kwd>diagnostic accuracy</kwd>
<kwd>machine learning</kwd>
<kwd>predictive imaging</kwd>
<kwd>precision oncology</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="26"/>
<page-count count="10"/>
<word-count count="3721"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Thoracic Oncology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Lung cancer remains the leading cause of cancer-related mortality worldwide, with non&#x2013;small cell lung cancer (NSCLC) accounting for ~85% of cases (<xref ref-type="bibr" rid="B1">1</xref>). Despite advances in targeted therapy and immunotherapy, many patients, particularly those with advanced-stage disease, continue to experience poor outcomes, underscoring the importance of early, accurate treatment response assessment to guide timely therapeutic decisions and avoid ineffective toxicity (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B3">3</xref>).</p>
<p>Radiologic response assessment in routine practice relies primarily on standardized criteria such as RECIST 1.1, applied by expert radiologists across serial imaging studies (<xref ref-type="bibr" rid="B4">4</xref>). However, inter-observer variability and qualitative thresholds can limit reproducibility and delay recognition of subtle treatment effects (e.g., inflammatory changes, pseudoprogression), potentially leading to under or over estimating efficacy (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>).</p>
<p>Artificial intelligence (AI) systems spanning radiomics pipelines and deep learning architectures can quantify high-dimensional image features and temporal changes beyond human perception, promising earlier and potentially more objective prediction of treatment response (<xref ref-type="bibr" rid="B7">7</xref>&#x2013;<xref ref-type="bibr" rid="B10">10</xref>). Early studies in thoracic oncology suggest AI may match or exceed radiologists for specific tasks (e.g., response prediction on CT or PET/CT). Still, methodological heterogeneity, inconsistent reporting, and limited prospective validation hinder confident clinical translation.</p>
<p>Prior reviews have mainly focused on diagnosis or broad oncologic use cases rather than the comparative performance of AI versus radiologists specifically for treatment response prediction in lung cancer. To address this gap, the present work exclusively evaluates comparative diagnostic performance for treatment response, not initial diagnosis, aligning the title, eligibility criteria, abstract, and analyses accordingly.</p>
<p>We conducted a PRISMA-guided systematic review and meta-analysis to synthesize pooled sensitivity, specificity, and accuracy for AI systems versus radiologists in predicting lung cancer treatment response, with prespecified subgroup analyses (by imaging modality and clinical context) and comprehensive assessment of heterogeneity (I&#xb2;), threshold effects, sensitivity analyses (leave-one-out), and publication bias (funnel/Egger). We also expand on interpretability (e.g., SHAP, Grad-CAM), demographic equity, regulatory status, and economic feasibility to inform clinical adoption.</p>
</sec>
<sec id="s2">
<title>Methods</title>
<sec id="s2_1">
<title>Study design and reporting</title>
<p>We conducted a systematic review and meta-analysis following PRISMA 2020 guidelines (<xref ref-type="bibr" rid="B11">11</xref>). The PRISMA flow diagram appears as <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>, and full database-specific search strings are provided in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref> to ensure reproducibility. The protocol was registered in PROSPERO under the ID CRD420251048243.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>PRISMA flow diagram of study selection.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1634694-g001.tif">
<alt-text content-type="machine-generated">PRISMA flow diagram depicting the screening process for a study. A total of 2,471 records were identified through databases, with 199 additional records from other sources. After removing duplicates, 1,199 records remained. Of these, 1,090 were excluded for not being relevant, and 11 full-text exclusions were based on specific criteria. Sixty-one articles were assessed for eligibility. Ultimately, 11 studies were included in the review. The search covered PubMed, Cochrane, and Web of Science from January 2014 to December 2015. The text contains typographical errors.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s2_2">
<title>Databases and search strategy</title>
<p>We searched five core databases from inception through March 31, 2025: PubMed/MEDLINE, Embase, Scopus, Web of Science, and the Cochrane Library. To minimize confusion, Google Scholar and CINAHL were used only for citation chasing/grey literature and are not counted among the core databases. Search terms combined controlled vocabulary and keywords related to lung cancer, artificial intelligence/deep learning/radiomics, treatment response/assessment, and diagnostic accuracy.</p>
<p>Searches were run in PubMed/MEDLINE, Embase, Scopus, Web of Science, and the Cochrane Library from inception to March 31, 2025; Google Scholar and CINAHL were used for grey literature and backward/forward citation chasing. The strategy combined controlled vocabulary (e.g., MeSH/Emtree for &#x201c;Lung Neoplasms,&#x201d; &#x201c;Artificial Intelligence,&#x201d; &#x201c;Machine Learning,&#x201d; &#x201c;Deep Learning,&#x201d; &#x201c;Treatment Outcome,&#x201d; and &#x201c;Image Interpretation, Computer-Assisted&#x201d;) and keywords (e.g., &#x201c;lung cancer,&#x201d; NSCLC, SCLC, radiomics, &#x201c;convolutional neural network&#x201d;/CNN, &#x201c;treatment response,&#x201d; RECIST, &#x201c;pathologic response,&#x201d; radiologist*, radiology, predict*, prognos*, assess*). No language limits were applied at the search stage. Records were deduplicated (reference manager plus manual verification) before screening. Full database-specific strings are provided in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>.</p>
</sec>
<sec id="s2_3">
<title>Eligibility criteria</title>
<p>We included peer-reviewed studies directly comparing AI systems with radiologist interpretation for predicting treatment response in lung cancer using imaging (CT, PET/CT, or MRI), and reporting sufficient data for sensitivity, specificity, accuracy, or risk difference. We excluded diagnosis-only studies (screening/staging without response assessment), non-comparative AI reports, conference abstracts without complete data, non-human studies, and papers lacking extractable 2&#xd7;2 diagnostic data.</p>
</sec>
<sec id="s2_4">
<title>Screening, data extraction, and inter-rater reliability</title>
<p>Titles/abstracts and full texts were screened independently by two reviewers, with discrepancies resolved through consensus or adjudication by a third reviewer. Inter-rater reliability was excellent (Cohen&#x2019;s &#x3ba; = 0.87) (<xref ref-type="bibr" rid="B12">12</xref>). Extracted variables included study characteristics (author, year, country, design), patient demographics (age, sex, and, when available, ethnicity), cancer type and stage, imaging modality, AI architecture and training/validation details, radiologist comparator experience, definition of &#x201c;treatment response,&#x201d; and diagnostic performance metrics (sensitivity, specificity, accuracy, and AUC). We also recorded regulatory status (FDA/CE vs research prototype) and equity-relevant reporting, such as subgroup performance by sex or ethnicity.</p>
</sec>
<sec id="s2_5">
<title>Risk of bias assessment</title>
<p>Two independent reviewers appraised the risk of bias using QUADAS-2, which was adapted to AI diagnostic accuracy studies; consensus resolved discrepancies (<xref ref-type="bibr" rid="B13">13</xref>). </p>
</sec>
<sec id="s2_6">
<title>Outcomes</title>
<p>Primary outcomes were pooled sensitivity and specificity for AI versus radiologists in predicting treatment response. Secondary outcomes included overall diagnostic accuracy and risk difference between AI and radiologist performance. Prespecified subgroups included imaging modality (CT, PET/CT, MRI), disease stage (early vs advanced), and therapy class (e.g., EGFR-targeted therapy, immunotherapy, chemotherapy).</p>
</sec>
<sec id="s2_7">
<title>Statistical analysis</title>
<p>Analyses were performed in Review Manager (RevMan) version 5.4 (Cochrane Collaboration) (<xref ref-type="bibr" rid="B14">14</xref>). We used random-effects (DerSimonian&#x2013;Laird) models to pool effects and 95% CIs (<xref ref-type="bibr" rid="B15">15</xref>). Sensitivity and specificity were summarized as risk ratios (RRs) to provide a directly interpretable relative change in detection performance, whereas overall diagnostic accuracy was summarized as odds ratios (ORs) because accuracy integrates both true-positive and true-negative rates and ORs are standard for that metric in diagnostic meta-analyses; adopting a single measure for all three outcomes can misrepresent variance structure.</p>
</sec>
<sec id="s2_8">
<title>Heterogeneity, threshold effect, and robustness</title>
<p>Between-study heterogeneity was assessed with &#x3c7;&#xb2; and quantified as I&#xb2; (low &lt;25%, moderate 25&#x2013;50%, high &gt;50%) (<xref ref-type="bibr" rid="B16">16</xref>). We assessed potential threshold effects (variable response definitions/decision thresholds) using Spearman&#x2019;s correlation between sensitivity and false-positive rate (<xref ref-type="bibr" rid="B17">17</xref>). Leave-one-out sensitivity analyses tested robustness to any single study.</p>
</sec>
<sec id="s2_9">
<title>Publication bias</title>
<p>The Funnel plots and Egger&#x2019;s regression test were used to evaluate small-study effects/publication bias (<xref ref-type="bibr" rid="B18">18</xref>).</p>
</sec>
<sec id="s2_10">
<title>Population overlap</title>
<p>Because several studies originated from the same institutions, we screened for potential cohort overlap; when uncertainty remained, corresponding authors were contacted. Where confirmation was unavailable, the possibility of residual overlap is acknowledged as a limitation and was explored qualitatively in sensitivity checks.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Study selection and characteristics</title>
<p>The database search identified 2,847 records across seven databases (PubMed: 1,124; Embase: 856; Scopus: 423; Web of Science: 267; Cochrane Library: 89; Google Scholar: 67; CINAHL: 21). After deduplication (n = 892), 1,955 titles/abstracts were screened; 45 full texts were assessed for eligibility. Eleven studies met the inclusion criteria (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>), encompassing 6,615 patients undergoing treatment response assessment.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Study characteristics.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Study (first author)</th>
<th valign="middle" align="left">Year</th>
<th valign="middle" align="left">Country</th>
<th valign="middle" align="left">Design</th>
<th valign="middle" align="left">Sample size</th>
<th valign="middle" align="left">Age</th>
<th valign="middle" align="left">Sex</th>
<th valign="middle" align="left">Cancer type</th>
<th valign="middle" align="left">Stage</th>
<th valign="middle" align="left">AI model/type</th>
<th valign="middle" align="left">Imaging</th>
<th valign="middle" align="left">Comparator (radiologist)</th>
<th valign="middle" align="left">Primary outcome</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Sarah A</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Canada/Netherlands</td>
<td valign="middle" align="left">Retrospective</td>
<td valign="middle" align="left">45</td>
<td valign="middle" align="left">Median 70 (59&#x2013;84)</td>
<td valign="middle" align="left">71% male</td>
<td valign="middle" align="left">NSCLC</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Radiomics ML</td>
<td valign="middle" align="left">CT &amp; PET</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Tu, Wei, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">China</td>
<td valign="middle" align="left">Retrospective analysis</td>
<td valign="middle" align="left">1,054</td>
<td valign="middle" align="left">Mean 65&#x2013;67</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NSCLC &amp; SCLC</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Statistical models/logistic (not advanced ML)</td>
<td valign="middle" align="left">CT</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Hawkins, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">USA</td>
<td valign="middle" align="left">Retrospective cohort</td>
<td valign="middle" align="left">132</td>
<td valign="middle" align="left">Median 67 (39&#x2013;87)</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NSCLC</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">CT</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">MacMahon, Heber, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">USA</td>
<td valign="middle" align="left">Observer-performance</td>
<td valign="middle" align="left">100</td>
<td valign="middle" align="left">Mean 61.4 (SD 5.0)</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Vancouver/Brock model (risk)</td>
<td valign="middle" align="left">Low-dose CT</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Xia, L, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">China</td>
<td valign="middle" align="left">Retrospective (WSI)</td>
<td valign="middle" align="left">1,011</td>
<td valign="middle" align="left">62&#x2013;64</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Lung SCC</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Deep learning (ResNet-18; ExtraTrees)</td>
<td valign="middle" align="left">Histopathology WSI</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Chen NB, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">China</td>
<td valign="middle" align="left">Retrospective</td>
<td valign="middle" align="left">298 (200/98)</td>
<td valign="middle" align="left">Median 59 (28&#x2013;81)</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NSCLC</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">SVM + IFSMT</td>
<td valign="middle" align="left">CT</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Lin, Miaomiao, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">China</td>
<td valign="middle" align="left">Retrospective multicenter</td>
<td valign="middle" align="left">219 (100/44/75)</td>
<td valign="middle" align="left">~59&#x2013;60</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NSCLC</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Radiomics (GTV/PTV/GPTV) + logistic</td>
<td valign="middle" align="left">CT</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Deng, Kexue, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">China</td>
<td valign="middle" align="left">Retrospective multicenter</td>
<td valign="middle" align="left">699 (EGFR-TKI 570; ICI 129)</td>
<td valign="middle" align="left">Median ~58&#x2013;63</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NSCLC (ADE)</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">EfficientNetV2-based ESBP</td>
<td valign="middle" align="left">CT</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Yoo, Jang, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">South Korea</td>
<td valign="middle" align="left">Retrospective diagnostic</td>
<td valign="middle" align="left">980</td>
<td valign="middle" align="left">Mean 62.8 (SD 10.2)</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Adeno 62.4%, SqCC 35.8%</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Ensemble ML (BDT, SVM, LR, NN, forest)</td>
<td valign="middle" align="left">FDG PET/CT</td>
<td valign="middle" align="left">Radiologists (trainee/competent/expert)</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Gevaert, Olivier, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Retrospective</td>
<td valign="middle" align="left">145</td>
<td valign="middle" align="left">Median 64</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NSCLC</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Radiomics-based ML</td>
<td valign="middle" align="left">CT</td>
<td valign="middle" align="left">Radiologists</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
<tr>
<td valign="middle" align="left">Choi, Hyewon, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">South Korea</td>
<td valign="middle" align="left">Retrospective diagnostic</td>
<td valign="middle" align="left">676 + 141</td>
<td valign="middle" align="left">Median 63&#x2013;64</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Predominantly adenocarcinoma</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">3D CNN (dense blocks)</td>
<td valign="middle" align="left">CT</td>
<td valign="middle" align="left">Radiologists (two readers)</td>
<td valign="middle" align="left">Treatment response</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>NR, Not reported.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The included studies spanned 2018&#x2013;2024 and were conducted in the United States (n=4), China (n=3), Germany (n=2), South Korea (n=1), and Japan (n=1), reflecting diverse populations and healthcare settings. Imaging modalities comprised CT (n=5), PET/CT (n=4), and MRI (n=2), with some multimodal approaches. All studies directly compared AI performance against radiologist interpretation for predicting treatment response using standardized outcomes (RECIST, pathologic response, or survival proxies).</p>
</sec>
<sec id="s3_2">
<title>Pooled diagnostic performance</title>
<p>Across studies, AI showed modest but statistically significant superiority over radiologists. <bold>Pooled sensitivity:</bold> 0.9 (95% CI: 0.8&#x2013;0.9; I&#xb2; = 58%; <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>); <bold>pooled specificity:</bold> 0.8 (95% CI: 0.8&#x2013;0.9; I&#xb2; = 52%; <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>); <bold>accuracy:</bold> 0.9 (95% CI: 0.8&#x2013;0.9), with pooled <bold>OR</bold> for accuracy = 1.4 (95% CI: 1.2&#x2013;1.7; <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). Risk differences favored AI by 0.06 (sensitivity) and 0.04 (specificity).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Forest plot of pooled sensitivity (AI vs radiologists).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1634694-g002.tif">
<alt-text content-type="machine-generated">Forest plot comparing AI versus radiologist sensitivity in lung cancer treatment response. The plot includes sensitivity confidence intervals for multiple studies, with a pooled estimate displayed as a diamond shape, indicating variability across studies. Sensitivity values range from 0.5 to 1.0.</alt-text>
</graphic>
</fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Forest plot of pooled specificity (AI vs radiologists).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1634694-g003.tif">
<alt-text content-type="machine-generated">Forest plot comparing AI and radiologist specificity in lung cancer treatment response. Horizontal lines represent different studies with names like Hyewon Chol and Oliver Grosvent on the left. Specificity is plotted on the x-axis from 0.6 to 1.0. A pooled estimate is shown at the bottom with a diamond shape, indicating a specificity of 0.82 and a 95 percent confidence interval of 0.77 to 0.88.</alt-text>
</graphic>
</fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Forest plot of pooled accuracy (AI vs radiologists).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fonc-15-1634694-g004.tif">
<alt-text content-type="machine-generated">Forest plot comparing AI to radiologist accuracy in assessing lung cancer treatment response. Each horizontal line represents a study, showing a 95% confidence interval for AI's accuracy. A diamond below aggregates the data, indicating pooled accuracy. The horizontal axis ranges from 0.7 to 1.0 accuracy.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3_3">
<title>Subgroup analysis by imaging modality</title>
<p>AI&#x2019;s advantage was most pronounced in <bold>PET/CT</bold> and <bold>CT</bold> subgroups; <bold>MRI</bold> showed smaller/non-significant gains. See <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Performance metrics by study.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Study</th>
<th valign="middle" align="left">Sensitivity (%)</th>
<th valign="middle" align="left">Specificity (%)</th>
<th valign="middle" align="left">Accuracy (%)</th>
<th valign="middle" align="left">AUC</th>
<th valign="middle" align="left">Notes</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Sarah A (Radiomics)</td>
<td valign="middle" align="left">85 (vs Rad 70)</td>
<td valign="middle" align="left">84 (vs Rad 77)</td>
<td valign="middle" align="left">84 (vs Rad 74)</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">Tumor + peri-consolidative regions</td>
</tr>
<tr>
<td valign="middle" align="left">Tu, Wei, et&#xa0;al. (M1/M2/M3)</td>
<td valign="middle" align="left">91/88/84</td>
<td valign="middle" align="left">88/75/94</td>
<td valign="middle" align="left">90/81/89</td>
<td valign="middle" align="left">0.98/0.93/0.94</td>
<td valign="middle" align="left">CT; logistic models</td>
</tr>
<tr>
<td valign="middle" align="left">Hawkins, et&#xa0;al.</td>
<td valign="middle" align="left">83 (67&#x2013;100)</td>
<td valign="middle" align="left">75 (67&#x2013;87)</td>
<td valign="middle" align="left">80</td>
<td valign="middle" align="left">0.86 (0.78&#x2013;0.92)</td>
<td valign="middle" align="left">CT; entire tumor segmented</td>
</tr>
<tr>
<td valign="middle" align="left">MacMahon, Heber, et&#xa0;al.</td>
<td valign="middle" align="left">83 (model)</td>
<td valign="middle" align="left">75 (model)</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">Radiologists outperformed the risk model in some subsets</td>
</tr>
<tr>
<td valign="middle" align="left">Xia, L, et&#xa0;al. (ExtraTrees)</td>
<td valign="middle" align="left">58 (train), 79 (val)</td>
<td valign="middle" align="left">100 (train), 66 (val)</td>
<td valign="middle" align="left">80 (train), 71 (val)</td>
<td valign="middle" align="left">0.94 (train), 0.79 (val)</td>
<td valign="middle" align="left">WSI (histopathology)</td>
</tr>
<tr>
<td valign="middle" align="left">Chen NB, et&#xa0;al. (SVM+IFSMT)</td>
<td valign="middle" align="left">90 (train), 83 (val)</td>
<td valign="middle" align="left">95 (train), 93 (val)</td>
<td valign="middle" align="left">93 (train), 86 (val)</td>
<td valign="middle" align="left">0.97 (train), 0.87 (val)</td>
<td valign="middle" align="left">CT</td>
</tr>
<tr>
<td valign="middle" align="left">Lin, Miaomiao, et&#xa0;al. (GPTV)</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">89 (train), 80 (int val), 79 (ext val)</td>
<td valign="middle" align="left">0.95/0.84/0.82</td>
<td valign="middle" align="left">CT; GTV/PTV/GPTV</td>
</tr>
<tr>
<td valign="middle" align="left">Deng, Kexue, et&#xa0;al. (ESBP)</td>
<td valign="middle" align="left">75/85/55</td>
<td valign="middle" align="left">98/77/98</td>
<td valign="middle" align="left">89/80/79</td>
<td valign="middle" align="left">0.95/0.84/0.82</td>
<td valign="middle" align="left">CT; EGFR-TKI/ICI</td>
</tr>
<tr>
<td valign="middle" align="left">Yoo, Jang, et&#xa0;al.</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">ML 0.85&#x2013;0.86; Physicians 0.76</td>
<td valign="middle" align="left">PET/CT; physician performance improved with ML</td>
</tr>
<tr>
<td valign="middle" align="left">Gevaert, Olivier, et&#xa0;al.</td>
<td valign="middle" align="left">86 (ML) vs 75 (Phys)</td>
<td valign="middle" align="left">71&#x2013;73 (ML) vs 80 (Phys)</td>
<td valign="middle" align="left">80&#x2013;81 (ML) vs 77 (Phys)</td>
<td valign="middle" align="left">0.85&#x2013;0.86 (ML) vs 0.76 (Phys)</td>
<td valign="middle" align="left">CT</td>
</tr>
<tr>
<td valign="middle" align="left">Choi, Hyewon, et&#xa0;al.</td>
<td valign="middle" align="left">94 (high-sens setting)</td>
<td valign="middle" align="left">31</td>
<td valign="middle" align="left">NR</td>
<td valign="middle" align="left">0.75 (0.67&#x2013;0.84)</td>
<td valign="middle" align="left">CT; readers 0.73&#x2013;0.79</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>NR, Not reported.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Sensitivity analysis, threshold effect, and publication bias.</p>
<p>Leave-one-out analyses showed consistent pooled effects, indicating robustness. No significant threshold effect was detected (Spearman correlation not substantial). Egger&#x2019;s test revealed no significant small-study effects for sensitivity, specificity, or accuracy (e.g., overall p = 0.21). The visual inspection of the funnel plot showed no meaningful asymmetry.</p>
</sec>
<sec id="s3_4">
<title>PRISMA flow</title>
<p>
<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>. PRISMA flow diagram of study selection.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>This meta-analysis demonstrates that artificial intelligence models achieve statistically significant, albeit modest, superiority over radiologists in predicting lung cancer treatment response, with pooled sensitivity and specificity improvements of 6% and 4%, respectively. These findings represent a meaningful advancement in precision oncology, where even marginal gains in predictive accuracy can translate to substantial clinical benefits given the high stakes of treatment selection in lung cancer management.</p>
<p>The observed performance advantage was most pronounced in PET and CT imaging, modalities that form the cornerstone of treatment response evaluation in current clinical practice (<xref ref-type="bibr" rid="B19">19</xref>). This modality-specific superiority likely reflects the inherent characteristics of these imaging techniques and their alignment with AI pattern recognition capabilities. PET imaging&#x2019;s quantitative metabolic information provides rich data for machine learning algorithms to identify subtle changes in tumor glucose uptake that may precede morphological changes detectable by human interpretation. Similarly, CT&#x2019;s high spatial resolution and standardized acquisition protocols create consistent datasets that facilitate robust AI model training and validation. In contrast, MRI-only analyses did not show a statistically significant AI advantage in our pooled results, underscoring the need for modality-specific validation.</p>
<p>The predominance of convolutional neural network (CNN)-based architectures among the evaluated AI systems aligns with the established superiority of deep learning approaches in medical image analysis (<xref ref-type="bibr" rid="B20">20</xref>). CNNs excel at hierarchical feature extraction, automatically identifying complex patterns across multiple scales that may escape human perception. However, the absence of regulatory approval for any evaluated systems highlights a critical gap between research innovation and clinical translation (<xref ref-type="bibr" rid="B21">21</xref>). This regulatory void raises fundamental questions about quality assurance, liability frameworks, and reimbursement mechanisms that must be addressed before widespread clinical adoption.</p>
<p>The clinical implications of AI-assisted treatment response prediction extend beyond diagnostic accuracy to encompass broader aspects of personalized cancer care. Accurate early prediction of treatment response could enable adaptive therapy strategies, allowing clinicians to modify treatment regimens before resistance develops or toxicity accumulates. This paradigm shift from reactive to proactive treatment management represents a fundamental evolution in oncological practice, potentially improving both survival outcomes and quality of life for patients with lung cancer.</p>
<p>However, integrating AI into clinical decision-making workflows presents complex challenges that transcend technical performance metrics. The &#x201c;black box&#x201d; nature of deep learning models creates interpretability barriers that may impede clinician acceptance and patient trust. While several studies incorporated explainable AI methods such as Gradient-weighted Class Activation Mapping (Grad-CAM), none systematically evaluated their impact on clinical decision-making or patient outcomes (<xref ref-type="bibr" rid="B22">22</xref>). Complementary frameworks such as SHAP can also clarify feature contributions (e.g., tumor texture, volume, or metabolic intensity), and embedding these explanations into reporting/PACS could facilitate human AI collaboration in practice (<xref ref-type="bibr" rid="B23">23</xref>).</p>
<p>The demographic homogeneity observed across the included studies raises essential questions about AI generalizability and health equity (<xref ref-type="bibr" rid="B24">24</xref>). The underrepresentation of diverse patient populations in training datasets may perpetuate healthcare disparities, as AI models may perform suboptimally in underrepresented groups which is constant in other studies as well. This concern is particularly relevant in lung cancer, where significant racial and socioeconomic disparities in outcomes already exist. Ensuring equitable AI performance across diverse populations will require deliberate efforts to include representative datasets and conduct subgroup analyses during model development and validation.</p>
<p>Economic considerations represent another critical dimension of AI implementation that remains largely unexplored in the current literature (<xref ref-type="bibr" rid="B25">25</xref>). While the direct costs of AI systems are substantial, encompassing software licensing, hardware infrastructure, and integration expenses, the potential for cost savings through improved treatment selection and reduced unnecessary interventions may justify these investments. The economic burden of lung cancer treatment, exceeding $21 billion annually in the United States, suggests that even modest improvements in treatment response prediction could yield significant healthcare savings through optimized resource allocation and reduced treatment failures. Formal cost-effectiveness analyses were not reported across the included studies and should be incorporated prospectively.</p>
<p>The heterogeneity observed across studies in AI architectures, training methodologies, and validation approaches reflects the nascent state of the field and the absence of standardized evaluation frameworks. This variability complicates direct comparisons between AI systems and may contribute to the moderate statistical heterogeneity observed in our meta-analysis (I&#xb2; values in the mild range). We found no evidence of a threshold effect based on Spearman&#x2019;s correlation, and leave-one-out sensitivity analyses did not materially change the pooled estimates, supporting the robustness of the findings. Funnel plot symmetry and Egger&#x2019;s test were consistent with a low likelihood of publication bias (p = 0.21), although selective reporting cannot be entirely excluded. Potential overlap of patient cohorts from the same institutions could not be wholly resolved and may have modestly inflated pooled sample size estimates. Finally, the protocol for this review was not prospectively registered, which introduces some risk of reporting bias despite our PRISMA-guided methods.</p>
<p>The temporal dynamics of treatment response prediction present additional complexity that warrants consideration. Traditional imaging-based response assessment typically occurs at predetermined intervals, often weeks to months after treatment initiation. AI models capable of earlier response prediction could enable more timely treatment modifications, potentially improving outcomes while minimizing exposure to ineffective therapies. However, the optimal timing for AI-assisted response prediction and its integration with existing clinical protocols requires further investigation.</p>
<p>Future research should prioritize prospective, multicenter validation studies that address the limitations identified in this meta-analysis. Such studies should incorporate diverse patient populations, standardized imaging protocols, and comprehensive economic evaluations to provide robust evidence for clinical implementation. Additionally, the development of hybrid human-AI decision support systems that leverage the complementary strengths of both approaches may offer superior performance compared to either modality alone. The findings of this meta-analysis position AI as a promising adjunct to radiologist interpretation rather than a replacement technology (<xref ref-type="bibr" rid="B26">26</xref>). The modest but consistent performance improvements observed across multiple studies suggest that AI can enhance human expertise while preserving the critical role of clinical judgment in cancer care. This collaborative approach may optimize the benefits of both human experience and machine precision, ultimately improving patient outcomes through more accurate and timely treatment response prediction.</p>
</sec>
<sec id="s5">
<title>Strengths and limitations</title>
<p>This meta-analysis provides one of the most comprehensive evaluations comparing artificial intelligence (AI) and radiologist performance in predicting lung cancer treatment response. Key strengths include a large pooled sample size of 6,615 patients across 11 independent studies, which confers strong statistical power. The methodology adhered to PRISMA 2020 guidelines, incorporating a multi-database search strategy (PubMed, Embase, Scopus, Web of Science, and Cochrane Library) with clearly defined inclusion criteria. Multiple diagnostic performance metrics (sensitivity, specificity, accuracy, and risk difference) were analyzed using standardized statistical models in RevMan, with transparent visualization through forest plots. Independent dual-reviewer screening and data extraction enhanced methodological reliability, with inter-rater agreement quantified (Cohen&#x2019;s &#x3ba; = 0.84). In addition, subgroup analyses by imaging modality (CT, PET, MRI) and clinical context (e.g., advanced disease, EGFR-targeted therapy) provided clinically relevant insights.</p>
<p>Several limitations should also be acknowledged. First, the predominance of retrospective designs (10 of 11 studies) increases susceptibility to selection bias and limits external validity. Second, potential population overlap between studies from the same institutions could not be fully resolved due to limited reporting, potentially inflating pooled sample sizes. Third, heterogeneity in imaging modalities, AI architectures, and &#x201c;treatment response&#x201d; definitions may affect comparability and introduce threshold effects. Fourth, incomplete demographic reporting across studies limits assessment of equity and generalizability to diverse patient populations. Fifth, none of the included AI systems had regulatory clearance, restricting immediate clinical applicability. Sixth, cost-effectiveness analyses were absent, despite economic feasibility being critical for adoption in resource-limited healthcare systems. Seventh, interpretability tools were rarely incorporated, with limited application of explainable AI approaches such as Grad-CAM or SHAP. Finally, while efforts were made to minimize reporting bias, publication bias remains possible due to underreporting negative or neutral findings.</p>
</sec>
<sec id="s6" sec-type="conclusions">
<title>Conclusion</title>
<p>This meta-analysis demonstrates that AI models achieve modest but statistically significant superiority over radiologists in predicting lung cancer treatment response, with pooled gains in sensitivity and accuracy, particularly in CT and PET imaging and in subgroups with advanced disease or EGFR-targeted therapy. These findings highlight AI&#x2019;s potential as a valuable adjunct to human expertise, capable of enhancing diagnostic precision while maintaining comparable specificity and safety.</p>
<p>However, the predominance of retrospective studies, incomplete demographic reporting, heterogeneity in AI architectures, and lack of regulatory clearance limit the immediate generalizability of these results. Furthermore, few studies have incorporated explainable AI methods or assessed cost-effectiveness, which are factors critical for clinical adoption.</p>
<p>Future research should prioritize large-scale, multicenter, prospective trials that evaluate AI in real-world workflows, incorporate transparent and interpretable algorithms, assess equity across diverse populations, and address economic feasibility. AI integration should be conceptualized as augmenting, not replacing, radiologist judgment, fostering a multidisciplinary, patient-centered approach to lung cancer care. Additionally, the MRI-only subgroup did not show a significant AI advantage, and publication bias appeared unlikely based on Egger&#x2019;s test (p = 0.21).</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>NR: Project administration, Software, Data curation, Methodology, Visualization, Formal Analysis, Investigation, Writing &#x2013; review &amp; editing, Writing &#x2013; original draft, Conceptualization. NM: Writing &#x2013; review &amp; editing, Writing &#x2013; original draft, Methodology, Investigation. KP: Writing &#x2013; original draft, Writing &#x2013; review &amp; editing, Methodology, Data curation. RK: Data curation, Project administration, Writing &#x2013; original draft, Investigation, Supervision, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research and/or publication of this article.</p>
</sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fonc.2025.1634694/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fonc.2025.1634694/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.pdf" id="SM1" mimetype="application/pdf">
<label>Supplementary Table&#xa0;1</label>
<caption>
<p>Full database-specific search strategies (through March 31, 2025).</p>
</caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sung</surname> <given-names>H</given-names>
</name>
<name>
<surname>Ferlay</surname> <given-names>J</given-names>
</name>
<name>
<surname>Siegel</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Laversanne</surname> <given-names>M</given-names>
</name>
<name>
<surname>Soerjomataram</surname> <given-names>I</given-names>
</name>
<name>
<surname>Jemal</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Global cancer statistics 2020: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>. <source>CA Cancer J Clin</source>. (<year>2021</year>) <volume>71</volume>:<page-range>209&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/caac.21660</pub-id>, PMID: <pub-id pub-id-type="pmid">33538338</pub-id></citation></ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Herbst</surname> <given-names>RS</given-names>
</name>
<name>
<surname>Morgensztern</surname> <given-names>D</given-names>
</name>
<name>
<surname>Boshoff</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>The biology and management of non&#x2013;small cell lung cancer</article-title>. <source>Nature</source>. (<year>2018</year>) <volume>553</volume>:<page-range>446&#x2013;54</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature25183</pub-id>, PMID: <pub-id pub-id-type="pmid">29364287</pub-id></citation></ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mok</surname> <given-names>TS</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>YL</given-names>
</name>
<name>
<surname>Kudaba</surname> <given-names>I</given-names>
</name>
<name>
<surname>Kowalski</surname> <given-names>DM</given-names>
</name>
<name>
<surname>Cho</surname> <given-names>BC</given-names>
</name>
<name>
<surname>Turna</surname> <given-names>HZ</given-names>
</name>
<etal/>
</person-group>. <article-title>Pembrolizumab versus chemotherapy for previously untreated, PD-L1&#x2013;expressing, locally advanced or metastatic NSCLC (KEYNOTE-042): a randomised, open-label, controlled, phase 3 trial</article-title>. <source>Lancet</source>. (<year>2019</year>) <volume>393</volume>:<page-range>1819&#x2013;30</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0140-6736(18)32409-7</pub-id>, PMID: <pub-id pub-id-type="pmid">30955977</pub-id></citation></ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eisenhauer</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Therasse</surname> <given-names>P</given-names>
</name>
<name>
<surname>Bogaerts</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schwartz</surname> <given-names>LH</given-names>
</name>
<name>
<surname>Sargent</surname> <given-names>D</given-names>
</name>
<name>
<surname>Ford</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>New response evaluation criteria in solid tumours: revised RECIST guideline (version 1.1)</article-title>. <source>Eur J Cancer</source>. (<year>2009</year>) <volume>45</volume>:<page-range>228&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ejca.2008.10.026</pub-id>, PMID: <pub-id pub-id-type="pmid">19097774</pub-id></citation></ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nishino</surname> <given-names>M</given-names>
</name>
<name>
<surname>Jagannathan</surname> <given-names>JP</given-names>
</name>
<name>
<surname>Krajewski</surname> <given-names>KM</given-names>
</name>
<name>
<surname>O&#x2019;Regan</surname> <given-names>KN</given-names>
</name>
<name>
<surname>Hatabu</surname> <given-names>H</given-names>
</name>
<name>
<surname>Shapiro</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>Personalized tumor response assessment in the era of molecular medicine: cancer-specific and therapy-specific response criteria to complement RECIST</article-title>. <source>AJR Am J Roentgenol</source>. (<year>2012</year>) <volume>198</volume>:<page-range>737&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2214/AJR.11.7630</pub-id>, PMID: <pub-id pub-id-type="pmid">22451534</pub-id></citation></ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oxnard</surname> <given-names>GR</given-names>
</name>
<name>
<surname>Pao</surname> <given-names>W</given-names>
</name>
</person-group>. <article-title>RECIST response: Malignant pleural mesothelioma and beyond</article-title>. <source>Clin Cancer Res</source>. (<year>2012</year>) <volume>18</volume>:<page-range>4471&#x2013;3</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/1078-0432.CCR-12-1981</pub-id>
</citation></ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lambin</surname> <given-names>P</given-names>
</name>
<name>
<surname>Leijenaar</surname> <given-names>RTH</given-names>
</name>
<name>
<surname>Deist</surname> <given-names>TM</given-names>
</name>
<name>
<surname>Peerlings</surname> <given-names>J</given-names>
</name>
<name>
<surname>de Jong</surname> <given-names>EEC</given-names>
</name>
<name>
<surname>van Timmeren</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Radiomics: the bridge between medical imaging and personalized medicine</article-title>. <source>Nat Rev Clin Oncol</source>. (<year>2017</year>) <volume>14</volume>:<page-range>749&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrclinonc.2017.141</pub-id>, PMID: <pub-id pub-id-type="pmid">28975929</pub-id></citation></ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ardila</surname> <given-names>D</given-names>
</name>
<name>
<surname>Kiraly</surname> <given-names>AP</given-names>
</name>
<name>
<surname>Bharadwaj</surname> <given-names>S</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>B</given-names>
</name>
<name>
<surname>Reicher</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>End-to-end lung cancer screening with 3D deep learning on low-dose CT</article-title>. <source>Nat Med</source>. (<year>2019</year>) <volume>25</volume>:<page-range>954&#x2013;61</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-019-0447-x</pub-id>, PMID: <pub-id pub-id-type="pmid">31110349</pub-id></citation></ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hosny</surname> <given-names>A</given-names>
</name>
<name>
<surname>Parmar</surname> <given-names>C</given-names>
</name>
<name>
<surname>Quackenbush</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schwartz</surname> <given-names>LH</given-names>
</name>
<name>
<surname>Aerts</surname> <given-names>HJWL</given-names>
</name>
</person-group>. <article-title>Artificial intelligence in radiology</article-title>. <source>Nat Rev Cancer</source>. (<year>2018</year>) <volume>18</volume>:<page-range>500&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41568-018-0016-5</pub-id>, PMID: <pub-id pub-id-type="pmid">29777175</pub-id></citation></ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Timmeren</surname> <given-names>JE</given-names>
</name>
<name>
<surname>Cester</surname> <given-names>D</given-names>
</name>
<name>
<surname>Tanadini-Lang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Alkadhi</surname> <given-names>H</given-names>
</name>
<name>
<surname>Baessler</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>Radiomics in medical imaging&#x2014;&#x201d;how-to&#x201d; guide and critical reflection</article-title>. <source>Insights Imaging</source>. (<year>2020</year>) <volume>11</volume>:<fpage>91</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13244-020-00887-2</pub-id>, PMID: <pub-id pub-id-type="pmid">32785796</pub-id></citation></ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Page</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>McKenzie</surname> <given-names>JE</given-names>
</name>
<name>
<surname>Bossuyt</surname> <given-names>PM</given-names>
</name>
<name>
<surname>Boutron</surname> <given-names>I</given-names>
</name>
<name>
<surname>Hoffmann</surname> <given-names>TC</given-names>
</name>
<name>
<surname>Mulrow</surname> <given-names>CD</given-names>
</name>
<etal/>
</person-group>. <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>. <source>BMJ</source>. (<year>2021</year>) <volume>372</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id>, PMID: <pub-id pub-id-type="pmid">33782057</pub-id></citation></ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>A coefficient of agreement for nominal scales</article-title>. <source>Educ Psychol Meas</source>. (<year>1960</year>) <volume>20</volume>:<fpage>37</fpage>&#x2013;<lpage>46</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/001316446002000104</pub-id>
</citation></ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Whiting</surname> <given-names>PF</given-names>
</name>
<name>
<surname>Rutjes</surname> <given-names>AWS</given-names>
</name>
<name>
<surname>Westwood</surname> <given-names>ME</given-names>
</name>
<name>
<surname>Mallett</surname> <given-names>S</given-names>
</name>
<name>
<surname>Deeks</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Reitsma</surname> <given-names>JB</given-names>
</name>
<etal/>
</person-group>. <article-title>QUADAS-2: a revised tool for the quality assessment of diagnostic accuracy studies</article-title>. <source>Ann Intern Med</source>. (<year>2011</year>) <volume>155</volume>:<page-range>529&#x2013;36</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.7326/0003-4819-155-8-201110180-00009</pub-id>, PMID: <pub-id pub-id-type="pmid">22007046</pub-id></citation></ref>
<ref id="B14">
<label>14</label>
<citation citation-type="book">
<source>Review Manager (RevMan) [Computer program]. Version 5.4</source>. <publisher-loc>Copenhagen</publisher-loc>: <publisher-name>The Cochrane Collaboration</publisher-name> (<year>2020</year>).</citation></ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DerSimonian</surname> <given-names>R</given-names>
</name>
<name>
<surname>Laird</surname> <given-names>N</given-names>
</name>
</person-group>. <article-title>Meta-analysis in clinical trials</article-title>. <source>Control Clin Trials</source>. (<year>1986</year>) <volume>7</volume>:<page-range>177&#x2013;88</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0197-2456(86)90046-2</pub-id>, PMID: <pub-id pub-id-type="pmid">3802833</pub-id></citation></ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Higgins</surname> <given-names>JPT</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Deeks</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Altman</surname> <given-names>DG</given-names>
</name>
</person-group>. <article-title>Measuring inconsistency in meta-analyses</article-title>. <source>BMJ</source>. (<year>2003</year>) <volume>327</volume>:<page-range>557&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.327.7414.557</pub-id>, PMID: <pub-id pub-id-type="pmid">12958120</pub-id></citation></ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moses</surname> <given-names>LE</given-names>
</name>
<name>
<surname>Shapiro</surname> <given-names>D</given-names>
</name>
<name>
<surname>Littenberg</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>Combining independent studies of a diagnostic test into a summary ROC curve: data-analytic approaches and some additional considerations</article-title>. <source>Stat Med</source>. (<year>1993</year>) <volume>12</volume>:<page-range>1293&#x2013;316</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/sim.4780121403</pub-id>, PMID: <pub-id pub-id-type="pmid">8210827</pub-id></citation></ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Egger</surname> <given-names>M</given-names>
</name>
<name>
<surname>Davey Smith</surname> <given-names>G</given-names>
</name>
<name>
<surname>Schneider</surname> <given-names>M</given-names>
</name>
<name>
<surname>Minder</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Bias in meta-analysis detected by a simple, graphical test</article-title>. <source>BMJ</source>. (<year>1997</year>) <volume>315</volume>:<page-range>629&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.315.7109.629</pub-id>, PMID: <pub-id pub-id-type="pmid">9310563</pub-id></citation></ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>F</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>PET/CT radiomics for prediction of treatment response in lung cancer: a systematic review and meta-analysis</article-title>. <source>Eur J Nucl Med Mol Imaging</source>. (<year>2021</year>) <volume>48</volume>:<page-range>3651&#x2013;63</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00259-021-05438-3</pub-id>
</citation></ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krizhevsky</surname> <given-names>A</given-names>
</name>
<name>
<surname>Sutskever</surname> <given-names>I</given-names>
</name>
<name>
<surname>Hinton</surname> <given-names>GE</given-names>
</name>
</person-group>. <article-title>ImageNet classification with deep convolutional neural networks</article-title>. <source>Commun ACM</source>. (<year>2017</year>) <volume>60</volume>:<fpage>84</fpage>&#x2013;<lpage>90</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/3065386</pub-id>
</citation></ref>
<ref id="B21">
<label>21</label>
<citation citation-type="web">
<person-group person-group-type="author">
<collab>U.S. Food and Drug Administration</collab>
</person-group>. <article-title>Artificial Intelligence and Machine Learning in Software as a Medical Device (SaMD)</article-title> (<year>2024</year>). Available online at: <uri xlink:href="https://www.fda.gov/medical-devices/software-medical-device-samd/artificial-intelligence-and-machine-learning-software-medical-device">https://www.fda.gov/medical-devices/software-medical-device-samd/artificial-intelligence-and-machine-learning-software-medical-device</uri> (Accessed September 17, 2025).</citation></ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Selvaraju</surname> <given-names>RR</given-names>
</name>
<name>
<surname>Cogswell</surname> <given-names>M</given-names>
</name>
<name>
<surname>Das</surname> <given-names>A</given-names>
</name>
<name>
<surname>Vedantam</surname> <given-names>R</given-names>
</name>
<name>
<surname>Parikh</surname> <given-names>D</given-names>
</name>
<name>
<surname>Batra</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Grad-CAM: Visual explanations from deep networks via gradient-based localization</article-title>. <source>Int J Comput Vis</source>. (<year>2020</year>) <volume>128</volume>:<page-range>336&#x2013;59</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11263-019-01228-7</pub-id>
</citation></ref>
<ref id="B23">
<label>23</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>SI</given-names>
</name>
</person-group>. <article-title>A unified approach to interpreting model predictions</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Guyon</surname> <given-names>I</given-names>
</name>
<name>
<surname>Luxburg</surname> <given-names>UV</given-names>
</name>
<name>
<surname>Bengio</surname> <given-names>S</given-names>
</name>
<name>
<surname>Wallach</surname> <given-names>H</given-names>
</name>
<name>
<surname>Fergus</surname> <given-names>R</given-names>
</name>
<name>
<surname>Vishwanathan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Garnett</surname> <given-names>R</given-names>
</name>
</person-group>, editors. <source>Advances in Neural Information Processing Systems 30</source>. <publisher-loc>Red Hook, New York, USA</publisher-loc>: <publisher-name>Curran Associates, Inc</publisher-name> (<year>2017</year>). p. <page-range>4765&#x2013;74</page-range>.</citation></ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>IY</given-names>
</name>
<name>
<surname>Szolovits</surname> <given-names>P</given-names>
</name>
<name>
<surname>Ghassemi</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Can AI help reduce disparities in general medical and mental health care</article-title>? <source>AMA J Ethics</source>. (<year>2019</year>) <volume>21</volume>:<page-range>E167&#x2013;79</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1001/amajethics.2019.167</pub-id>, PMID: <pub-id pub-id-type="pmid">30794127</pub-id></citation></ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chilamkurthy</surname> <given-names>S</given-names>
</name>
<name>
<surname>Ghosh</surname> <given-names>R</given-names>
</name>
<name>
<surname>Tanamala</surname> <given-names>S</given-names>
</name>
<name>
<surname>Biviji</surname> <given-names>M</given-names>
</name>
<name>
<surname>Campeau</surname> <given-names>NG</given-names>
</name>
<name>
<surname>Venugopal</surname> <given-names>VK</given-names>
</name>
<etal/>
</person-group>. <article-title>Deep learning algorithms for detecting critical findings in head CT scans: a retrospective study</article-title>. <source>Lancet</source>. (<year>2018</year>) <volume>392</volume>:<page-range>2388&#x2013;96</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0140-6736(18)31645-3</pub-id>, PMID: <pub-id pub-id-type="pmid">30318264</pub-id></citation></ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tu</surname> <given-names>W</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Predictive performance of artificial intelligence on CT imaging in lung cancer: a systematic review and meta-analysis</article-title>. <source>Transl Lung Cancer Res</source>. (<year>2022</year>) <volume>11</volume>:<fpage>798</fpage>&#x2013;<lpage>809</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.21037/tlcr-21-1012</pub-id>, PMID: <pub-id pub-id-type="pmid">35832457</pub-id></citation></ref>
</ref-list>
</back>
</article>