<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="discussion" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Oncol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Oncology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Oncol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2234-943X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fonc.2026.1730967</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Opinion</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Critical considerations for the use of deep learning models in clinical oncology prediction</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Zhao</surname><given-names>Daren</given-names></name>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2634448/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
</contrib-group>
<aff id="aff1"><institution>Faculty of Social Sciences and Humanities, Mahidol University</institution>, <city>Salaya</city>, <state>Nakhon Pathom</state>,&#xa0;<country country="th">Thailand</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Daren Zhao, <email xlink:href="mailto:cdzhaodaren@163.com">cdzhaodaren@163.com</email>; <email xlink:href="mailto:daren.zha@student.mahidol.ac.th">daren.zha@student.mahidol.ac.th</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-24">
<day>24</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>16</volume>
<elocation-id>1730967</elocation-id>
<history>
<date date-type="received">
<day>23</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>07</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Zhao.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Zhao</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-24">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<kwd-group>
<kwd>breast cancer</kwd>
<kwd>clinical prediction models</kwd>
<kwd>clinical research</kwd>
<kwd>deep learning models</kwd>
<kwd>generalizability</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was not received for this work and/or its publication.</funding-statement>
</funding-group>
<counts>
<fig-count count="0"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="10"/>
<page-count count="3"/>
<word-count count="982"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Breast Cancer</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<p>In a recent study on clinical prediction models, Liu (<xref ref-type="bibr" rid="B1">1</xref>) and colleagues developed a deep learning model to predict ALN pCR in ALN-positive breast cancer patients undergoing NAT by analyzing longitudinal ultrasound images of the primary tumor and ALNs. Their findings provide an evidence-based rationale for omitting unnecessary axillary lymph node dissection. This study serves as a representative case of clinical prediction modeling in oncology research, with its preliminary results indicating promising potential for clinical translation. However, it is imperative for us to acknowledge that a critical gap remains between the technical development of prediction models and their practical application in real-world clinical decision-making. We think that these challenges reflect common issues widely encountered by researchers in implementing clinical prediction models, which urgently require recognition and deep analysis.</p>
<p>First and foremost, comprehensive analysis and reporting of the limitations of prediction models serve as an essential foundation for adhering to clinical prediction model guidelines and establishing model transparency and credibility (<xref ref-type="bibr" rid="B2">2</xref>). One of the core challenges faced by clinical prediction models lies in ensuring that their development and reporting strictly comply with established clinical prediction model guidelines, which is the primary prerequisite for realizing their clinical translation value.</p>
<p>However, in this study, the reporting of the model&#x2019;s limitations may not be comprehensive. The authors focused only on the inherent shortcomings of deep learning models, specifically their lack of interpretability due to the &#x201c;black box&#x201d; nature, while overlooking other important issues that should be addressed in model interpretation. For example, a key and common limitation of deep learning models is their sensitivity to noise and outliers (<xref ref-type="bibr" rid="B3">3</xref>). In real and complex clinical environments, the iShape model could be affected by various sources of &#x201c;noise,&#x201d; including technical parameters of equipment, biological and phenotypic heterogeneity across populations, and differences in the standardization of clinical procedures. This sensitivity to noise, if not adequately accounted for, may lead to serious clinical consequences. For instance, in breast cancer diagnosis, it could result in misjudgment of lymph node metastasis status, thereby increasing the risk of inappropriately omitting necessary axillary surgery. These noise factors are directly related to whether the model can be reliably applied in actual clinical practice. Although the model demonstrated excellent performance in the study, its methodology lacks sufficient discussion and analysis of how these potential noise sources are addressed.</p>
<p>Therefore, we strongly recommend that researchers developing and reporting machine learning prediction models in the biomedical field strictly adhere to relevant guidelines (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B4">4</xref>) to achieve standardization in the reporting of clinical prediction models. In particular, it is essential to provide objective reporting and analysis of the clinical significance and limitations of prediction models, as this is key to establishing reliable clinical prediction models.</p>
<p>Secondly, on the basis of standardized reporting for clinical prediction models, only by further improving the generalization ability of the models and systematically evaluating their inherent limitations can related research truly possess clinical guiding significance. This requires the implementation of a rigorous validation process before a model is put into clinical use: continuously selecting the optimal model, conducting long-term testing of its robustness and generalization ability, and ultimately validating its effectiveness in real-world clinical settings (<xref ref-type="bibr" rid="B5">5</xref>). Therefore, the generalization ability and stability of a model are decisive factors in achieving clinical translation.</p>
<p>However, the generalization capability and stability of a model depend on several key factors, including its applicability, sample size (<xref ref-type="bibr" rid="B6">6</xref>), and population heterogeneity. In this study, the authors did not thoroughly explore the potential impact of sample size and cohort heterogeneity on the performance of the iShape model. For example, the study trained the model using data from only 371 patients, which may be an insufficient sample size and could affect its stability in real&#x2212;world applications. Furthermore, in terms of population representativeness, while the training data integrated information from two hospitals in northern and southern regions, the external validation was conducted solely on data from three hospitals in the south. This results in inadequate diversity in geography and demographics in the external validation cohort, which may weaken the model&#x2019;s generalizability. Although the authors mentioned in the limitations section that large&#x2212;scale prospective studies are needed in the future, how to systematically address the above heterogeneity challenges remains a critical practical difficulty in implementation.</p>
<p>Therefore, we recommend that future studies should build sufficiently large and adequately diversified training datasets based on clearer clinical objectives, in order to meet the basic data requirements of deep learning. The datasets should strive to cover geographical and demographic variations within the target population, and incorporate variability from different levels of medical institutions and different models of equipment. This approach can help control key confounding factors at the source and ultimately enhance the model&#x2019;s generalizability and stability. Moreover, external validation should be emphasized, with a focus on evaluating the model&#x2019;s applicability across diverse populations, real-world clinical settings, and in samples of sufficient size (<xref ref-type="bibr" rid="B7">7</xref>&#x2013;<xref ref-type="bibr" rid="B9">9</xref>).</p>
<p>In conclusion, systematic shortcomings in reporting and insufficient robustness are prevalent issues in current clinical prediction model research. Yet, the clinical environment in real-world studies is complex and ever-changing. Consequently, translating prediction models into clinical practice must focus critically on two essential aspects: &#x201c;standardized reporting&#x201d; and &#x201c;rigorous validation.&#x201d; &#x201c;Standardized reporting&#x201d; necessitates addressing all potential limitations of a model, including its algorithmic characteristics and sensitivity to data noise. Meanwhile, &#x201c;rigorous validation&#x201d; requires controlling for key confounding factors and overcoming practical constraints. These include data access limitations, multi-center data harmonization, and the execution of prospective validation studies, all of which necessitate long-term and repeated performance assessments of the model. Therefore, future research should adhere to clinical prediction model development guidelines and prioritize establishing a systematic evaluation framework that integrates both &#x201c;standardized reporting&#x201d; and &#x201c;rigorous validation.&#x201d; This is vital for effectively translating developed prediction models from methodology into clinical practice, transforming them into reliable and practical tools for clinical decision support (<xref ref-type="bibr" rid="B10">10</xref>).</p>
</body>
<back>
<sec id="s1" sec-type="author-contributions">
<title>Author contributions</title>
<p>DZ: Data curation, Supervision, Investigation, Methodology, Conceptualization, Software, Writing &#x2013; review &amp; editing, Resources, Visualization, Project administration, Validation, Funding acquisition, Formal analysis, Writing &#x2013; original draft.</p></sec>
<sec id="s3" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s4" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s5" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>Y</given-names></name>
<name><surname>Huang</surname> <given-names>J</given-names></name>
<name><surname>Pei</surname> <given-names>S</given-names></name>
<name><surname>Wang</surname> <given-names>Y</given-names></name>
<name><surname>Cui</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Deep learning-based prediction of axillary pathological complete response in patients with breast cancer using longitudinal multiregional ultrasound</article-title>. <source>EBioMedicine</source>. (<year>2025</year>) <volume>119</volume>:<elocation-id>105896</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ebiom.2025.105896</pub-id>, PMID: <pub-id pub-id-type="pmid">40876229</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Luo</surname> <given-names>W</given-names></name>
<name><surname>Phung</surname> <given-names>D</given-names></name>
<name><surname>Tran</surname> <given-names>T</given-names></name>
<name><surname>Gupta</surname> <given-names>S</given-names></name>
<name><surname>Rana</surname> <given-names>S</given-names></name>
<name><surname>Karmakar</surname> <given-names>C</given-names></name>
<etal/>
</person-group>. 
<article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: A multidisciplinary view</article-title>. <source>J Med Internet Res</source>. (<year>2016</year>) <volume>18</volume>:<fpage>e323</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id>, PMID: <pub-id pub-id-type="pmid">27986644</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>Y</given-names></name>
<name><surname>Ma</surname> <given-names>X</given-names></name>
<name><surname>Chen</surname> <given-names>Z</given-names></name>
<name><surname>Luo</surname> <given-names>Y</given-names></name>
<name><surname>Yi</surname> <given-names>J</given-names></name>
<name><surname>Bailey</surname> <given-names>J.</given-names></name>
</person-group>
<article-title>Symmetric cross entropy for robust learning with noisy labels</article-title>. In: <source>Proceedings of the IEEE/CVF international conference on computer vision</source>. <publisher-loc>Seoul, Korea (South)</publisher-loc>: 
<publisher-name>IEEE</publisher-name> (<year>2019</year>). p. <page-range>322&#x2013;30</page-range>.
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Efthimiou</surname> <given-names>O</given-names></name>
<name><surname>Seo</surname> <given-names>M</given-names></name>
<name><surname>Chalkou</surname> <given-names>K</given-names></name>
<name><surname>Debray</surname> <given-names>T</given-names></name>
<name><surname>Egger</surname> <given-names>M</given-names></name>
<name><surname>Salanti</surname> <given-names>G</given-names></name>
<etal/>
</person-group>. 
<article-title>Developing clinical prediction models: a step-by-step guide</article-title>. <source>BMJ</source>. (<year>2024</year>) <volume>386</volume>:<fpage>e078276</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2023-078276</pub-id>, PMID: <pub-id pub-id-type="pmid">39227063</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Topol</surname> <given-names>EJ</given-names></name>
</person-group>. 
<article-title>High-performance medicine: the convergence of human and artificial intelligence</article-title>. <source>Nat Med</source>. (<year>2019</year>) <volume>25</volume>:<fpage>44</fpage>&#x2013;<lpage>56</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-018-0300-7</pub-id>, PMID: <pub-id pub-id-type="pmid">30617339</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Silvey</surname> <given-names>S</given-names></name>
<name><surname>Liu</surname> <given-names>J</given-names></name>
</person-group>. 
<article-title>Sample size requirements for popular classification algorithms in tabular clinical data: empirical study</article-title>. <source>J Med Internet Res</source>. (<year>2024</year>) <volume>26</volume>:<fpage>e60231</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2196/60231</pub-id>, PMID: <pub-id pub-id-type="pmid">39689306</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Collins</surname> <given-names>GS</given-names></name>
<name><surname>Dhiman</surname> <given-names>P</given-names></name>
<name><surname>Ma</surname> <given-names>J</given-names></name>
<name><surname>Schlussel</surname> <given-names>MM</given-names></name>
<name><surname>Archer</surname> <given-names>L</given-names></name>
<name><surname>Van Calster</surname> <given-names>B</given-names></name>
<etal/>
</person-group>. 
<article-title>Evaluation of clinical prediction models (part 1): from development to external validation</article-title>. <source>BMJ</source>. (<year>2024</year>) <volume>384</volume>:<fpage>e074819</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2023-074819</pub-id>, PMID: <pub-id pub-id-type="pmid">38191193</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Riley</surname> <given-names>RD</given-names></name>
<name><surname>Archer</surname> <given-names>L</given-names></name>
<name><surname>Snell</surname> <given-names>KIE</given-names></name>
<name><surname>Ensor</surname> <given-names>J</given-names></name>
<name><surname>Dhiman</surname> <given-names>P</given-names></name>
<name><surname>Martin</surname> <given-names>GP</given-names></name>
<etal/>
</person-group>. 
<article-title>Evaluation of clinical prediction models (part 2): how to undertake an external validation study</article-title>. <source>BMJ</source>. (<year>2024</year>) <volume>384</volume>:<fpage>e074820</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2023-074820</pub-id>, PMID: <pub-id pub-id-type="pmid">38224968</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Riley</surname> <given-names>RD</given-names></name>
<name><surname>Snell</surname> <given-names>KIE</given-names></name>
<name><surname>Archer</surname> <given-names>L</given-names></name>
<name><surname>Ensor</surname> <given-names>J</given-names></name>
<name><surname>Debray</surname> <given-names>TPA</given-names></name>
<name><surname>van Calster</surname> <given-names>B</given-names></name>
<etal/>
</person-group>. 
<article-title>Evaluation of clinical prediction models (part 3): calculating the sample size required for an external validation study</article-title>. <source>BMJ</source>. (<year>2024</year>) <volume>384</volume>:<fpage>e074821</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj-2023-074821</pub-id>, PMID: <pub-id pub-id-type="pmid">38253388</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhao</surname> <given-names>D</given-names></name>
</person-group>. 
<article-title>ALSFRS-R forecasting: A reliable clinical tool? A translational challenge</article-title>. <source>Eur J Clin Invest</source>. (<year>2026</year>) <volume>56</volume>:<fpage>e70178</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/eci.70178</pub-id>, PMID: <pub-id pub-id-type="pmid">41567083</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/618108">Shuoyu Xu</ext-link>, Bio-totem Pte Ltd, China</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2258794">Balu Bhasuran</ext-link>, Florida State University, United States</p></fn>
</fn-group>
</back>
</article>